{ "best_metric": null, "best_model_checkpoint": null, "epoch": 3.0, "eval_steps": 500, "global_step": 16215, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 4.1067761806981525e-08, "loss": 1.5921, "step": 1 }, { "epoch": 0.0, "learning_rate": 8.213552361396305e-08, "loss": 1.6189, "step": 2 }, { "epoch": 0.0, "learning_rate": 1.2320328542094456e-07, "loss": 1.65, "step": 3 }, { "epoch": 0.0, "learning_rate": 1.642710472279261e-07, "loss": 1.6296, "step": 4 }, { "epoch": 0.0, "learning_rate": 2.053388090349076e-07, "loss": 1.6896, "step": 5 }, { "epoch": 0.0, "learning_rate": 2.464065708418891e-07, "loss": 1.6875, "step": 6 }, { "epoch": 0.0, "learning_rate": 2.8747433264887066e-07, "loss": 1.6377, "step": 7 }, { "epoch": 0.0, "learning_rate": 3.285420944558522e-07, "loss": 1.614, "step": 8 }, { "epoch": 0.0, "learning_rate": 3.696098562628337e-07, "loss": 1.6377, "step": 9 }, { "epoch": 0.0, "learning_rate": 4.106776180698152e-07, "loss": 1.6128, "step": 10 }, { "epoch": 0.0, "learning_rate": 4.517453798767968e-07, "loss": 1.6458, "step": 11 }, { "epoch": 0.0, "learning_rate": 4.928131416837782e-07, "loss": 1.6069, "step": 12 }, { "epoch": 0.0, "learning_rate": 5.338809034907598e-07, "loss": 1.6434, "step": 13 }, { "epoch": 0.0, "learning_rate": 5.749486652977413e-07, "loss": 1.6765, "step": 14 }, { "epoch": 0.0, "learning_rate": 6.160164271047228e-07, "loss": 1.6565, "step": 15 }, { "epoch": 0.0, "learning_rate": 6.570841889117044e-07, "loss": 1.6038, "step": 16 }, { "epoch": 0.0, "learning_rate": 6.981519507186859e-07, "loss": 1.6178, "step": 17 }, { "epoch": 0.0, "learning_rate": 7.392197125256674e-07, "loss": 1.6411, "step": 18 }, { "epoch": 0.0, "learning_rate": 7.80287474332649e-07, "loss": 1.6315, "step": 19 }, { "epoch": 0.0, "learning_rate": 8.213552361396304e-07, "loss": 1.614, "step": 20 }, { "epoch": 0.0, "learning_rate": 8.62422997946612e-07, "loss": 1.605, "step": 21 }, { "epoch": 0.0, "learning_rate": 9.034907597535936e-07, "loss": 1.6322, "step": 22 }, { "epoch": 0.0, "learning_rate": 9.44558521560575e-07, "loss": 1.6252, "step": 23 }, { "epoch": 0.0, "learning_rate": 9.856262833675565e-07, "loss": 1.6237, "step": 24 }, { "epoch": 0.0, "learning_rate": 1.026694045174538e-06, "loss": 1.616, "step": 25 }, { "epoch": 0.0, "learning_rate": 1.0677618069815197e-06, "loss": 1.6543, "step": 26 }, { "epoch": 0.0, "learning_rate": 1.1088295687885013e-06, "loss": 1.6383, "step": 27 }, { "epoch": 0.01, "learning_rate": 1.1498973305954826e-06, "loss": 1.542, "step": 28 }, { "epoch": 0.01, "learning_rate": 1.1909650924024642e-06, "loss": 1.6225, "step": 29 }, { "epoch": 0.01, "learning_rate": 1.2320328542094456e-06, "loss": 1.5896, "step": 30 }, { "epoch": 0.01, "learning_rate": 1.2731006160164272e-06, "loss": 1.599, "step": 31 }, { "epoch": 0.01, "learning_rate": 1.3141683778234088e-06, "loss": 1.5987, "step": 32 }, { "epoch": 0.01, "learning_rate": 1.3552361396303904e-06, "loss": 1.6034, "step": 33 }, { "epoch": 0.01, "learning_rate": 1.3963039014373718e-06, "loss": 1.5964, "step": 34 }, { "epoch": 0.01, "learning_rate": 1.4373716632443531e-06, "loss": 1.6306, "step": 35 }, { "epoch": 0.01, "learning_rate": 1.4784394250513347e-06, "loss": 1.5944, "step": 36 }, { "epoch": 0.01, "learning_rate": 1.5195071868583163e-06, "loss": 1.6477, "step": 37 }, { "epoch": 0.01, "learning_rate": 1.560574948665298e-06, "loss": 1.5564, "step": 38 }, { "epoch": 0.01, "learning_rate": 1.6016427104722793e-06, "loss": 1.6156, "step": 39 }, { "epoch": 0.01, "learning_rate": 1.6427104722792609e-06, "loss": 1.5686, "step": 40 }, { "epoch": 0.01, "learning_rate": 1.6837782340862425e-06, "loss": 1.584, "step": 41 }, { "epoch": 0.01, "learning_rate": 1.724845995893224e-06, "loss": 1.5863, "step": 42 }, { "epoch": 0.01, "learning_rate": 1.7659137577002056e-06, "loss": 1.584, "step": 43 }, { "epoch": 0.01, "learning_rate": 1.8069815195071872e-06, "loss": 1.5985, "step": 44 }, { "epoch": 0.01, "learning_rate": 1.8480492813141684e-06, "loss": 1.6193, "step": 45 }, { "epoch": 0.01, "learning_rate": 1.88911704312115e-06, "loss": 1.5394, "step": 46 }, { "epoch": 0.01, "learning_rate": 1.930184804928132e-06, "loss": 1.5745, "step": 47 }, { "epoch": 0.01, "learning_rate": 1.971252566735113e-06, "loss": 1.5318, "step": 48 }, { "epoch": 0.01, "learning_rate": 2.0123203285420946e-06, "loss": 1.512, "step": 49 }, { "epoch": 0.01, "learning_rate": 2.053388090349076e-06, "loss": 1.5366, "step": 50 }, { "epoch": 0.01, "learning_rate": 2.0944558521560577e-06, "loss": 1.4609, "step": 51 }, { "epoch": 0.01, "learning_rate": 2.1355236139630393e-06, "loss": 1.5394, "step": 52 }, { "epoch": 0.01, "learning_rate": 2.176591375770021e-06, "loss": 1.5072, "step": 53 }, { "epoch": 0.01, "learning_rate": 2.2176591375770025e-06, "loss": 1.5492, "step": 54 }, { "epoch": 0.01, "learning_rate": 2.2587268993839837e-06, "loss": 1.5154, "step": 55 }, { "epoch": 0.01, "learning_rate": 2.2997946611909653e-06, "loss": 1.5406, "step": 56 }, { "epoch": 0.01, "learning_rate": 2.340862422997947e-06, "loss": 1.5162, "step": 57 }, { "epoch": 0.01, "learning_rate": 2.3819301848049284e-06, "loss": 1.4792, "step": 58 }, { "epoch": 0.01, "learning_rate": 2.42299794661191e-06, "loss": 1.5302, "step": 59 }, { "epoch": 0.01, "learning_rate": 2.464065708418891e-06, "loss": 1.4581, "step": 60 }, { "epoch": 0.01, "learning_rate": 2.505133470225873e-06, "loss": 1.4871, "step": 61 }, { "epoch": 0.01, "learning_rate": 2.5462012320328544e-06, "loss": 1.4376, "step": 62 }, { "epoch": 0.01, "learning_rate": 2.587268993839836e-06, "loss": 1.4595, "step": 63 }, { "epoch": 0.01, "learning_rate": 2.6283367556468176e-06, "loss": 1.4794, "step": 64 }, { "epoch": 0.01, "learning_rate": 2.669404517453799e-06, "loss": 1.4563, "step": 65 }, { "epoch": 0.01, "learning_rate": 2.7104722792607808e-06, "loss": 1.4671, "step": 66 }, { "epoch": 0.01, "learning_rate": 2.7515400410677623e-06, "loss": 1.3944, "step": 67 }, { "epoch": 0.01, "learning_rate": 2.7926078028747435e-06, "loss": 1.4477, "step": 68 }, { "epoch": 0.01, "learning_rate": 2.833675564681725e-06, "loss": 1.4591, "step": 69 }, { "epoch": 0.01, "learning_rate": 2.8747433264887063e-06, "loss": 1.4739, "step": 70 }, { "epoch": 0.01, "learning_rate": 2.915811088295688e-06, "loss": 1.4006, "step": 71 }, { "epoch": 0.01, "learning_rate": 2.9568788501026694e-06, "loss": 1.384, "step": 72 }, { "epoch": 0.01, "learning_rate": 2.997946611909651e-06, "loss": 1.4237, "step": 73 }, { "epoch": 0.01, "learning_rate": 3.0390143737166326e-06, "loss": 1.4268, "step": 74 }, { "epoch": 0.01, "learning_rate": 3.0800821355236142e-06, "loss": 1.3925, "step": 75 }, { "epoch": 0.01, "learning_rate": 3.121149897330596e-06, "loss": 1.3998, "step": 76 }, { "epoch": 0.01, "learning_rate": 3.1622176591375774e-06, "loss": 1.4031, "step": 77 }, { "epoch": 0.01, "learning_rate": 3.2032854209445586e-06, "loss": 1.4244, "step": 78 }, { "epoch": 0.01, "learning_rate": 3.24435318275154e-06, "loss": 1.3795, "step": 79 }, { "epoch": 0.01, "learning_rate": 3.2854209445585218e-06, "loss": 1.3856, "step": 80 }, { "epoch": 0.01, "learning_rate": 3.3264887063655033e-06, "loss": 1.3722, "step": 81 }, { "epoch": 0.02, "learning_rate": 3.367556468172485e-06, "loss": 1.3555, "step": 82 }, { "epoch": 0.02, "learning_rate": 3.4086242299794665e-06, "loss": 1.3352, "step": 83 }, { "epoch": 0.02, "learning_rate": 3.449691991786448e-06, "loss": 1.3832, "step": 84 }, { "epoch": 0.02, "learning_rate": 3.4907597535934297e-06, "loss": 1.3633, "step": 85 }, { "epoch": 0.02, "learning_rate": 3.5318275154004113e-06, "loss": 1.3248, "step": 86 }, { "epoch": 0.02, "learning_rate": 3.572895277207393e-06, "loss": 1.3418, "step": 87 }, { "epoch": 0.02, "learning_rate": 3.6139630390143745e-06, "loss": 1.3228, "step": 88 }, { "epoch": 0.02, "learning_rate": 3.6550308008213552e-06, "loss": 1.3426, "step": 89 }, { "epoch": 0.02, "learning_rate": 3.696098562628337e-06, "loss": 1.3487, "step": 90 }, { "epoch": 0.02, "learning_rate": 3.7371663244353184e-06, "loss": 1.2986, "step": 91 }, { "epoch": 0.02, "learning_rate": 3.7782340862423e-06, "loss": 1.3711, "step": 92 }, { "epoch": 0.02, "learning_rate": 3.819301848049282e-06, "loss": 1.3521, "step": 93 }, { "epoch": 0.02, "learning_rate": 3.860369609856264e-06, "loss": 1.2946, "step": 94 }, { "epoch": 0.02, "learning_rate": 3.901437371663245e-06, "loss": 1.2649, "step": 95 }, { "epoch": 0.02, "learning_rate": 3.942505133470226e-06, "loss": 1.2981, "step": 96 }, { "epoch": 0.02, "learning_rate": 3.9835728952772075e-06, "loss": 1.309, "step": 97 }, { "epoch": 0.02, "learning_rate": 4.024640657084189e-06, "loss": 1.2554, "step": 98 }, { "epoch": 0.02, "learning_rate": 4.065708418891171e-06, "loss": 1.267, "step": 99 }, { "epoch": 0.02, "learning_rate": 4.106776180698152e-06, "loss": 1.2729, "step": 100 }, { "epoch": 0.02, "learning_rate": 4.147843942505134e-06, "loss": 1.2901, "step": 101 }, { "epoch": 0.02, "learning_rate": 4.1889117043121155e-06, "loss": 1.2582, "step": 102 }, { "epoch": 0.02, "learning_rate": 4.229979466119097e-06, "loss": 1.2625, "step": 103 }, { "epoch": 0.02, "learning_rate": 4.271047227926079e-06, "loss": 1.2356, "step": 104 }, { "epoch": 0.02, "learning_rate": 4.31211498973306e-06, "loss": 1.2274, "step": 105 }, { "epoch": 0.02, "learning_rate": 4.353182751540042e-06, "loss": 1.2261, "step": 106 }, { "epoch": 0.02, "learning_rate": 4.3942505133470234e-06, "loss": 1.2069, "step": 107 }, { "epoch": 0.02, "learning_rate": 4.435318275154005e-06, "loss": 1.2444, "step": 108 }, { "epoch": 0.02, "learning_rate": 4.476386036960986e-06, "loss": 1.1964, "step": 109 }, { "epoch": 0.02, "learning_rate": 4.517453798767967e-06, "loss": 1.2257, "step": 110 }, { "epoch": 0.02, "learning_rate": 4.558521560574949e-06, "loss": 1.2506, "step": 111 }, { "epoch": 0.02, "learning_rate": 4.5995893223819305e-06, "loss": 1.1949, "step": 112 }, { "epoch": 0.02, "learning_rate": 4.640657084188912e-06, "loss": 1.1882, "step": 113 }, { "epoch": 0.02, "learning_rate": 4.681724845995894e-06, "loss": 1.1805, "step": 114 }, { "epoch": 0.02, "learning_rate": 4.722792607802875e-06, "loss": 1.1712, "step": 115 }, { "epoch": 0.02, "learning_rate": 4.763860369609857e-06, "loss": 1.1835, "step": 116 }, { "epoch": 0.02, "learning_rate": 4.8049281314168385e-06, "loss": 1.162, "step": 117 }, { "epoch": 0.02, "learning_rate": 4.84599589322382e-06, "loss": 1.1772, "step": 118 }, { "epoch": 0.02, "learning_rate": 4.887063655030802e-06, "loss": 1.1715, "step": 119 }, { "epoch": 0.02, "learning_rate": 4.928131416837782e-06, "loss": 1.1467, "step": 120 }, { "epoch": 0.02, "learning_rate": 4.969199178644764e-06, "loss": 1.1494, "step": 121 }, { "epoch": 0.02, "learning_rate": 5.010266940451746e-06, "loss": 1.156, "step": 122 }, { "epoch": 0.02, "learning_rate": 5.051334702258728e-06, "loss": 1.1536, "step": 123 }, { "epoch": 0.02, "learning_rate": 5.092402464065709e-06, "loss": 1.1388, "step": 124 }, { "epoch": 0.02, "learning_rate": 5.1334702258726895e-06, "loss": 1.118, "step": 125 }, { "epoch": 0.02, "learning_rate": 5.174537987679672e-06, "loss": 1.1114, "step": 126 }, { "epoch": 0.02, "learning_rate": 5.215605749486653e-06, "loss": 1.1198, "step": 127 }, { "epoch": 0.02, "learning_rate": 5.256673511293635e-06, "loss": 1.0861, "step": 128 }, { "epoch": 0.02, "learning_rate": 5.297741273100616e-06, "loss": 1.1017, "step": 129 }, { "epoch": 0.02, "learning_rate": 5.338809034907598e-06, "loss": 1.0916, "step": 130 }, { "epoch": 0.02, "learning_rate": 5.379876796714579e-06, "loss": 1.0729, "step": 131 }, { "epoch": 0.02, "learning_rate": 5.4209445585215615e-06, "loss": 1.0893, "step": 132 }, { "epoch": 0.02, "learning_rate": 5.462012320328542e-06, "loss": 1.0481, "step": 133 }, { "epoch": 0.02, "learning_rate": 5.503080082135525e-06, "loss": 1.0302, "step": 134 }, { "epoch": 0.02, "learning_rate": 5.5441478439425054e-06, "loss": 1.0627, "step": 135 }, { "epoch": 0.03, "learning_rate": 5.585215605749487e-06, "loss": 1.0522, "step": 136 }, { "epoch": 0.03, "learning_rate": 5.626283367556469e-06, "loss": 1.0263, "step": 137 }, { "epoch": 0.03, "learning_rate": 5.66735112936345e-06, "loss": 1.0533, "step": 138 }, { "epoch": 0.03, "learning_rate": 5.708418891170432e-06, "loss": 1.0875, "step": 139 }, { "epoch": 0.03, "learning_rate": 5.7494866529774125e-06, "loss": 1.0711, "step": 140 }, { "epoch": 0.03, "learning_rate": 5.790554414784395e-06, "loss": 1.0188, "step": 141 }, { "epoch": 0.03, "learning_rate": 5.831622176591376e-06, "loss": 1.0533, "step": 142 }, { "epoch": 0.03, "learning_rate": 5.872689938398358e-06, "loss": 1.0159, "step": 143 }, { "epoch": 0.03, "learning_rate": 5.913757700205339e-06, "loss": 1.0139, "step": 144 }, { "epoch": 0.03, "learning_rate": 5.954825462012321e-06, "loss": 1.0056, "step": 145 }, { "epoch": 0.03, "learning_rate": 5.995893223819302e-06, "loss": 1.0155, "step": 146 }, { "epoch": 0.03, "learning_rate": 6.036960985626284e-06, "loss": 0.9924, "step": 147 }, { "epoch": 0.03, "learning_rate": 6.078028747433265e-06, "loss": 1.0199, "step": 148 }, { "epoch": 0.03, "learning_rate": 6.119096509240247e-06, "loss": 0.9819, "step": 149 }, { "epoch": 0.03, "learning_rate": 6.1601642710472284e-06, "loss": 0.9725, "step": 150 }, { "epoch": 0.03, "learning_rate": 6.20123203285421e-06, "loss": 0.9829, "step": 151 }, { "epoch": 0.03, "learning_rate": 6.242299794661192e-06, "loss": 1.0171, "step": 152 }, { "epoch": 0.03, "learning_rate": 6.283367556468173e-06, "loss": 0.972, "step": 153 }, { "epoch": 0.03, "learning_rate": 6.324435318275155e-06, "loss": 0.9502, "step": 154 }, { "epoch": 0.03, "learning_rate": 6.365503080082136e-06, "loss": 0.9582, "step": 155 }, { "epoch": 0.03, "learning_rate": 6.406570841889117e-06, "loss": 0.9367, "step": 156 }, { "epoch": 0.03, "learning_rate": 6.4476386036960996e-06, "loss": 0.9357, "step": 157 }, { "epoch": 0.03, "learning_rate": 6.48870636550308e-06, "loss": 0.9376, "step": 158 }, { "epoch": 0.03, "learning_rate": 6.529774127310062e-06, "loss": 0.9349, "step": 159 }, { "epoch": 0.03, "learning_rate": 6.5708418891170435e-06, "loss": 0.9053, "step": 160 }, { "epoch": 0.03, "learning_rate": 6.611909650924025e-06, "loss": 0.9021, "step": 161 }, { "epoch": 0.03, "learning_rate": 6.652977412731007e-06, "loss": 0.8971, "step": 162 }, { "epoch": 0.03, "learning_rate": 6.694045174537988e-06, "loss": 0.9295, "step": 163 }, { "epoch": 0.03, "learning_rate": 6.73511293634497e-06, "loss": 0.9197, "step": 164 }, { "epoch": 0.03, "learning_rate": 6.7761806981519515e-06, "loss": 0.8802, "step": 165 }, { "epoch": 0.03, "learning_rate": 6.817248459958933e-06, "loss": 0.8498, "step": 166 }, { "epoch": 0.03, "learning_rate": 6.858316221765914e-06, "loss": 0.8743, "step": 167 }, { "epoch": 0.03, "learning_rate": 6.899383983572896e-06, "loss": 0.8762, "step": 168 }, { "epoch": 0.03, "learning_rate": 6.940451745379877e-06, "loss": 0.8755, "step": 169 }, { "epoch": 0.03, "learning_rate": 6.981519507186859e-06, "loss": 0.8496, "step": 170 }, { "epoch": 0.03, "learning_rate": 7.02258726899384e-06, "loss": 0.862, "step": 171 }, { "epoch": 0.03, "learning_rate": 7.063655030800823e-06, "loss": 0.8651, "step": 172 }, { "epoch": 0.03, "learning_rate": 7.104722792607803e-06, "loss": 0.8268, "step": 173 }, { "epoch": 0.03, "learning_rate": 7.145790554414786e-06, "loss": 0.8538, "step": 174 }, { "epoch": 0.03, "learning_rate": 7.1868583162217665e-06, "loss": 0.842, "step": 175 }, { "epoch": 0.03, "learning_rate": 7.227926078028749e-06, "loss": 0.8586, "step": 176 }, { "epoch": 0.03, "learning_rate": 7.26899383983573e-06, "loss": 0.8243, "step": 177 }, { "epoch": 0.03, "learning_rate": 7.3100616016427104e-06, "loss": 0.8373, "step": 178 }, { "epoch": 0.03, "learning_rate": 7.351129363449693e-06, "loss": 0.8561, "step": 179 }, { "epoch": 0.03, "learning_rate": 7.392197125256674e-06, "loss": 0.8077, "step": 180 }, { "epoch": 0.03, "learning_rate": 7.433264887063656e-06, "loss": 0.8385, "step": 181 }, { "epoch": 0.03, "learning_rate": 7.474332648870637e-06, "loss": 0.8184, "step": 182 }, { "epoch": 0.03, "learning_rate": 7.515400410677619e-06, "loss": 0.806, "step": 183 }, { "epoch": 0.03, "learning_rate": 7.5564681724846e-06, "loss": 0.8054, "step": 184 }, { "epoch": 0.03, "learning_rate": 7.597535934291582e-06, "loss": 0.7851, "step": 185 }, { "epoch": 0.03, "learning_rate": 7.638603696098564e-06, "loss": 0.7806, "step": 186 }, { "epoch": 0.03, "learning_rate": 7.679671457905545e-06, "loss": 0.7686, "step": 187 }, { "epoch": 0.03, "learning_rate": 7.720739219712527e-06, "loss": 0.7664, "step": 188 }, { "epoch": 0.03, "learning_rate": 7.761806981519508e-06, "loss": 0.7518, "step": 189 }, { "epoch": 0.04, "learning_rate": 7.80287474332649e-06, "loss": 0.7764, "step": 190 }, { "epoch": 0.04, "learning_rate": 7.843942505133471e-06, "loss": 0.7932, "step": 191 }, { "epoch": 0.04, "learning_rate": 7.885010266940452e-06, "loss": 0.7809, "step": 192 }, { "epoch": 0.04, "learning_rate": 7.926078028747434e-06, "loss": 0.7871, "step": 193 }, { "epoch": 0.04, "learning_rate": 7.967145790554415e-06, "loss": 0.7555, "step": 194 }, { "epoch": 0.04, "learning_rate": 8.008213552361397e-06, "loss": 0.7412, "step": 195 }, { "epoch": 0.04, "learning_rate": 8.049281314168378e-06, "loss": 0.7625, "step": 196 }, { "epoch": 0.04, "learning_rate": 8.09034907597536e-06, "loss": 0.7529, "step": 197 }, { "epoch": 0.04, "learning_rate": 8.131416837782341e-06, "loss": 0.7601, "step": 198 }, { "epoch": 0.04, "learning_rate": 8.172484599589324e-06, "loss": 0.7577, "step": 199 }, { "epoch": 0.04, "learning_rate": 8.213552361396305e-06, "loss": 0.7613, "step": 200 }, { "epoch": 0.04, "learning_rate": 8.254620123203287e-06, "loss": 0.7566, "step": 201 }, { "epoch": 0.04, "learning_rate": 8.295687885010268e-06, "loss": 0.7382, "step": 202 }, { "epoch": 0.04, "learning_rate": 8.33675564681725e-06, "loss": 0.7445, "step": 203 }, { "epoch": 0.04, "learning_rate": 8.377823408624231e-06, "loss": 0.7262, "step": 204 }, { "epoch": 0.04, "learning_rate": 8.418891170431213e-06, "loss": 0.7281, "step": 205 }, { "epoch": 0.04, "learning_rate": 8.459958932238194e-06, "loss": 0.7359, "step": 206 }, { "epoch": 0.04, "learning_rate": 8.501026694045177e-06, "loss": 0.7009, "step": 207 }, { "epoch": 0.04, "learning_rate": 8.542094455852157e-06, "loss": 0.7243, "step": 208 }, { "epoch": 0.04, "learning_rate": 8.583162217659138e-06, "loss": 0.744, "step": 209 }, { "epoch": 0.04, "learning_rate": 8.62422997946612e-06, "loss": 0.742, "step": 210 }, { "epoch": 0.04, "learning_rate": 8.665297741273101e-06, "loss": 0.685, "step": 211 }, { "epoch": 0.04, "learning_rate": 8.706365503080084e-06, "loss": 0.6918, "step": 212 }, { "epoch": 0.04, "learning_rate": 8.747433264887064e-06, "loss": 0.6991, "step": 213 }, { "epoch": 0.04, "learning_rate": 8.788501026694047e-06, "loss": 0.7303, "step": 214 }, { "epoch": 0.04, "learning_rate": 8.829568788501028e-06, "loss": 0.6993, "step": 215 }, { "epoch": 0.04, "learning_rate": 8.87063655030801e-06, "loss": 0.6792, "step": 216 }, { "epoch": 0.04, "learning_rate": 8.91170431211499e-06, "loss": 0.7262, "step": 217 }, { "epoch": 0.04, "learning_rate": 8.952772073921972e-06, "loss": 0.6923, "step": 218 }, { "epoch": 0.04, "learning_rate": 8.993839835728954e-06, "loss": 0.7157, "step": 219 }, { "epoch": 0.04, "learning_rate": 9.034907597535935e-06, "loss": 0.6956, "step": 220 }, { "epoch": 0.04, "learning_rate": 9.075975359342917e-06, "loss": 0.6977, "step": 221 }, { "epoch": 0.04, "learning_rate": 9.117043121149898e-06, "loss": 0.6926, "step": 222 }, { "epoch": 0.04, "learning_rate": 9.15811088295688e-06, "loss": 0.6883, "step": 223 }, { "epoch": 0.04, "learning_rate": 9.199178644763861e-06, "loss": 0.6827, "step": 224 }, { "epoch": 0.04, "learning_rate": 9.240246406570844e-06, "loss": 0.6686, "step": 225 }, { "epoch": 0.04, "learning_rate": 9.281314168377824e-06, "loss": 0.6764, "step": 226 }, { "epoch": 0.04, "learning_rate": 9.322381930184807e-06, "loss": 0.6979, "step": 227 }, { "epoch": 0.04, "learning_rate": 9.363449691991787e-06, "loss": 0.699, "step": 228 }, { "epoch": 0.04, "learning_rate": 9.404517453798768e-06, "loss": 0.68, "step": 229 }, { "epoch": 0.04, "learning_rate": 9.44558521560575e-06, "loss": 0.6762, "step": 230 }, { "epoch": 0.04, "learning_rate": 9.486652977412731e-06, "loss": 0.697, "step": 231 }, { "epoch": 0.04, "learning_rate": 9.527720739219714e-06, "loss": 0.6723, "step": 232 }, { "epoch": 0.04, "learning_rate": 9.568788501026695e-06, "loss": 0.6701, "step": 233 }, { "epoch": 0.04, "learning_rate": 9.609856262833677e-06, "loss": 0.6753, "step": 234 }, { "epoch": 0.04, "learning_rate": 9.650924024640658e-06, "loss": 0.6646, "step": 235 }, { "epoch": 0.04, "learning_rate": 9.69199178644764e-06, "loss": 0.6682, "step": 236 }, { "epoch": 0.04, "learning_rate": 9.733059548254621e-06, "loss": 0.7046, "step": 237 }, { "epoch": 0.04, "learning_rate": 9.774127310061603e-06, "loss": 0.6578, "step": 238 }, { "epoch": 0.04, "learning_rate": 9.815195071868584e-06, "loss": 0.6501, "step": 239 }, { "epoch": 0.04, "learning_rate": 9.856262833675565e-06, "loss": 0.6819, "step": 240 }, { "epoch": 0.04, "learning_rate": 9.897330595482547e-06, "loss": 0.6911, "step": 241 }, { "epoch": 0.04, "learning_rate": 9.938398357289528e-06, "loss": 0.6745, "step": 242 }, { "epoch": 0.04, "learning_rate": 9.97946611909651e-06, "loss": 0.6593, "step": 243 }, { "epoch": 0.05, "learning_rate": 1.0020533880903491e-05, "loss": 0.6496, "step": 244 }, { "epoch": 0.05, "learning_rate": 1.0061601642710472e-05, "loss": 0.6481, "step": 245 }, { "epoch": 0.05, "learning_rate": 1.0102669404517456e-05, "loss": 0.6551, "step": 246 }, { "epoch": 0.05, "learning_rate": 1.0143737166324437e-05, "loss": 0.6225, "step": 247 }, { "epoch": 0.05, "learning_rate": 1.0184804928131418e-05, "loss": 0.6431, "step": 248 }, { "epoch": 0.05, "learning_rate": 1.0225872689938398e-05, "loss": 0.6256, "step": 249 }, { "epoch": 0.05, "learning_rate": 1.0266940451745379e-05, "loss": 0.6478, "step": 250 }, { "epoch": 0.05, "learning_rate": 1.0308008213552363e-05, "loss": 0.6625, "step": 251 }, { "epoch": 0.05, "learning_rate": 1.0349075975359344e-05, "loss": 0.6483, "step": 252 }, { "epoch": 0.05, "learning_rate": 1.0390143737166325e-05, "loss": 0.6399, "step": 253 }, { "epoch": 0.05, "learning_rate": 1.0431211498973305e-05, "loss": 0.6475, "step": 254 }, { "epoch": 0.05, "learning_rate": 1.047227926078029e-05, "loss": 0.648, "step": 255 }, { "epoch": 0.05, "learning_rate": 1.051334702258727e-05, "loss": 0.6511, "step": 256 }, { "epoch": 0.05, "learning_rate": 1.0554414784394251e-05, "loss": 0.6466, "step": 257 }, { "epoch": 0.05, "learning_rate": 1.0595482546201232e-05, "loss": 0.6491, "step": 258 }, { "epoch": 0.05, "learning_rate": 1.0636550308008216e-05, "loss": 0.6408, "step": 259 }, { "epoch": 0.05, "learning_rate": 1.0677618069815197e-05, "loss": 0.6533, "step": 260 }, { "epoch": 0.05, "learning_rate": 1.0718685831622177e-05, "loss": 0.6216, "step": 261 }, { "epoch": 0.05, "learning_rate": 1.0759753593429158e-05, "loss": 0.6441, "step": 262 }, { "epoch": 0.05, "learning_rate": 1.0800821355236139e-05, "loss": 0.6611, "step": 263 }, { "epoch": 0.05, "learning_rate": 1.0841889117043123e-05, "loss": 0.6383, "step": 264 }, { "epoch": 0.05, "learning_rate": 1.0882956878850104e-05, "loss": 0.6385, "step": 265 }, { "epoch": 0.05, "learning_rate": 1.0924024640657084e-05, "loss": 0.6318, "step": 266 }, { "epoch": 0.05, "learning_rate": 1.0965092402464065e-05, "loss": 0.6562, "step": 267 }, { "epoch": 0.05, "learning_rate": 1.100616016427105e-05, "loss": 0.6302, "step": 268 }, { "epoch": 0.05, "learning_rate": 1.104722792607803e-05, "loss": 0.6272, "step": 269 }, { "epoch": 0.05, "learning_rate": 1.1088295687885011e-05, "loss": 0.6133, "step": 270 }, { "epoch": 0.05, "learning_rate": 1.1129363449691992e-05, "loss": 0.6275, "step": 271 }, { "epoch": 0.05, "learning_rate": 1.1170431211498974e-05, "loss": 0.6737, "step": 272 }, { "epoch": 0.05, "learning_rate": 1.1211498973305956e-05, "loss": 0.6561, "step": 273 }, { "epoch": 0.05, "learning_rate": 1.1252566735112937e-05, "loss": 0.644, "step": 274 }, { "epoch": 0.05, "learning_rate": 1.1293634496919918e-05, "loss": 0.621, "step": 275 }, { "epoch": 0.05, "learning_rate": 1.13347022587269e-05, "loss": 0.6279, "step": 276 }, { "epoch": 0.05, "learning_rate": 1.1375770020533883e-05, "loss": 0.6373, "step": 277 }, { "epoch": 0.05, "learning_rate": 1.1416837782340864e-05, "loss": 0.6285, "step": 278 }, { "epoch": 0.05, "learning_rate": 1.1457905544147844e-05, "loss": 0.6238, "step": 279 }, { "epoch": 0.05, "learning_rate": 1.1498973305954825e-05, "loss": 0.6577, "step": 280 }, { "epoch": 0.05, "learning_rate": 1.1540041067761808e-05, "loss": 0.6148, "step": 281 }, { "epoch": 0.05, "learning_rate": 1.158110882956879e-05, "loss": 0.631, "step": 282 }, { "epoch": 0.05, "learning_rate": 1.162217659137577e-05, "loss": 0.6358, "step": 283 }, { "epoch": 0.05, "learning_rate": 1.1663244353182751e-05, "loss": 0.6263, "step": 284 }, { "epoch": 0.05, "learning_rate": 1.1704312114989734e-05, "loss": 0.6399, "step": 285 }, { "epoch": 0.05, "learning_rate": 1.1745379876796716e-05, "loss": 0.6223, "step": 286 }, { "epoch": 0.05, "learning_rate": 1.1786447638603697e-05, "loss": 0.6139, "step": 287 }, { "epoch": 0.05, "learning_rate": 1.1827515400410678e-05, "loss": 0.6226, "step": 288 }, { "epoch": 0.05, "learning_rate": 1.186858316221766e-05, "loss": 0.6307, "step": 289 }, { "epoch": 0.05, "learning_rate": 1.1909650924024643e-05, "loss": 0.609, "step": 290 }, { "epoch": 0.05, "learning_rate": 1.1950718685831623e-05, "loss": 0.6487, "step": 291 }, { "epoch": 0.05, "learning_rate": 1.1991786447638604e-05, "loss": 0.6048, "step": 292 }, { "epoch": 0.05, "learning_rate": 1.2032854209445587e-05, "loss": 0.6241, "step": 293 }, { "epoch": 0.05, "learning_rate": 1.2073921971252567e-05, "loss": 0.6075, "step": 294 }, { "epoch": 0.05, "learning_rate": 1.211498973305955e-05, "loss": 0.5846, "step": 295 }, { "epoch": 0.05, "learning_rate": 1.215605749486653e-05, "loss": 0.6212, "step": 296 }, { "epoch": 0.05, "learning_rate": 1.2197125256673511e-05, "loss": 0.6161, "step": 297 }, { "epoch": 0.06, "learning_rate": 1.2238193018480494e-05, "loss": 0.6277, "step": 298 }, { "epoch": 0.06, "learning_rate": 1.2279260780287476e-05, "loss": 0.6009, "step": 299 }, { "epoch": 0.06, "learning_rate": 1.2320328542094457e-05, "loss": 0.6175, "step": 300 }, { "epoch": 0.06, "learning_rate": 1.2361396303901438e-05, "loss": 0.6204, "step": 301 }, { "epoch": 0.06, "learning_rate": 1.240246406570842e-05, "loss": 0.6204, "step": 302 }, { "epoch": 0.06, "learning_rate": 1.24435318275154e-05, "loss": 0.6298, "step": 303 }, { "epoch": 0.06, "learning_rate": 1.2484599589322383e-05, "loss": 0.6048, "step": 304 }, { "epoch": 0.06, "learning_rate": 1.2525667351129364e-05, "loss": 0.599, "step": 305 }, { "epoch": 0.06, "learning_rate": 1.2566735112936346e-05, "loss": 0.6148, "step": 306 }, { "epoch": 0.06, "learning_rate": 1.2607802874743327e-05, "loss": 0.601, "step": 307 }, { "epoch": 0.06, "learning_rate": 1.264887063655031e-05, "loss": 0.605, "step": 308 }, { "epoch": 0.06, "learning_rate": 1.268993839835729e-05, "loss": 0.6145, "step": 309 }, { "epoch": 0.06, "learning_rate": 1.2731006160164273e-05, "loss": 0.6189, "step": 310 }, { "epoch": 0.06, "learning_rate": 1.2772073921971254e-05, "loss": 0.6045, "step": 311 }, { "epoch": 0.06, "learning_rate": 1.2813141683778234e-05, "loss": 0.6075, "step": 312 }, { "epoch": 0.06, "learning_rate": 1.2854209445585217e-05, "loss": 0.6022, "step": 313 }, { "epoch": 0.06, "learning_rate": 1.2895277207392199e-05, "loss": 0.6151, "step": 314 }, { "epoch": 0.06, "learning_rate": 1.293634496919918e-05, "loss": 0.5987, "step": 315 }, { "epoch": 0.06, "learning_rate": 1.297741273100616e-05, "loss": 0.6088, "step": 316 }, { "epoch": 0.06, "learning_rate": 1.3018480492813143e-05, "loss": 0.6217, "step": 317 }, { "epoch": 0.06, "learning_rate": 1.3059548254620124e-05, "loss": 0.6195, "step": 318 }, { "epoch": 0.06, "learning_rate": 1.3100616016427106e-05, "loss": 0.6033, "step": 319 }, { "epoch": 0.06, "learning_rate": 1.3141683778234087e-05, "loss": 0.5959, "step": 320 }, { "epoch": 0.06, "learning_rate": 1.318275154004107e-05, "loss": 0.611, "step": 321 }, { "epoch": 0.06, "learning_rate": 1.322381930184805e-05, "loss": 0.6147, "step": 322 }, { "epoch": 0.06, "learning_rate": 1.3264887063655033e-05, "loss": 0.6118, "step": 323 }, { "epoch": 0.06, "learning_rate": 1.3305954825462013e-05, "loss": 0.5926, "step": 324 }, { "epoch": 0.06, "learning_rate": 1.3347022587268994e-05, "loss": 0.6177, "step": 325 }, { "epoch": 0.06, "learning_rate": 1.3388090349075977e-05, "loss": 0.5829, "step": 326 }, { "epoch": 0.06, "learning_rate": 1.3429158110882959e-05, "loss": 0.6082, "step": 327 }, { "epoch": 0.06, "learning_rate": 1.347022587268994e-05, "loss": 0.5834, "step": 328 }, { "epoch": 0.06, "learning_rate": 1.351129363449692e-05, "loss": 0.6076, "step": 329 }, { "epoch": 0.06, "learning_rate": 1.3552361396303903e-05, "loss": 0.6203, "step": 330 }, { "epoch": 0.06, "learning_rate": 1.3593429158110885e-05, "loss": 0.5809, "step": 331 }, { "epoch": 0.06, "learning_rate": 1.3634496919917866e-05, "loss": 0.5991, "step": 332 }, { "epoch": 0.06, "learning_rate": 1.3675564681724847e-05, "loss": 0.577, "step": 333 }, { "epoch": 0.06, "learning_rate": 1.3716632443531828e-05, "loss": 0.5739, "step": 334 }, { "epoch": 0.06, "learning_rate": 1.3757700205338812e-05, "loss": 0.5638, "step": 335 }, { "epoch": 0.06, "learning_rate": 1.3798767967145792e-05, "loss": 0.6108, "step": 336 }, { "epoch": 0.06, "learning_rate": 1.3839835728952773e-05, "loss": 0.5778, "step": 337 }, { "epoch": 0.06, "learning_rate": 1.3880903490759754e-05, "loss": 0.5952, "step": 338 }, { "epoch": 0.06, "learning_rate": 1.3921971252566736e-05, "loss": 0.6117, "step": 339 }, { "epoch": 0.06, "learning_rate": 1.3963039014373719e-05, "loss": 0.6102, "step": 340 }, { "epoch": 0.06, "learning_rate": 1.40041067761807e-05, "loss": 0.588, "step": 341 }, { "epoch": 0.06, "learning_rate": 1.404517453798768e-05, "loss": 0.5934, "step": 342 }, { "epoch": 0.06, "learning_rate": 1.4086242299794661e-05, "loss": 0.6019, "step": 343 }, { "epoch": 0.06, "learning_rate": 1.4127310061601645e-05, "loss": 0.6105, "step": 344 }, { "epoch": 0.06, "learning_rate": 1.4168377823408626e-05, "loss": 0.591, "step": 345 }, { "epoch": 0.06, "learning_rate": 1.4209445585215607e-05, "loss": 0.6019, "step": 346 }, { "epoch": 0.06, "learning_rate": 1.4250513347022587e-05, "loss": 0.5856, "step": 347 }, { "epoch": 0.06, "learning_rate": 1.4291581108829572e-05, "loss": 0.6106, "step": 348 }, { "epoch": 0.06, "learning_rate": 1.4332648870636552e-05, "loss": 0.5721, "step": 349 }, { "epoch": 0.06, "learning_rate": 1.4373716632443533e-05, "loss": 0.5963, "step": 350 }, { "epoch": 0.06, "learning_rate": 1.4414784394250514e-05, "loss": 0.6104, "step": 351 }, { "epoch": 0.07, "learning_rate": 1.4455852156057498e-05, "loss": 0.5981, "step": 352 }, { "epoch": 0.07, "learning_rate": 1.4496919917864479e-05, "loss": 0.5918, "step": 353 }, { "epoch": 0.07, "learning_rate": 1.453798767967146e-05, "loss": 0.5663, "step": 354 }, { "epoch": 0.07, "learning_rate": 1.457905544147844e-05, "loss": 0.5769, "step": 355 }, { "epoch": 0.07, "learning_rate": 1.4620123203285421e-05, "loss": 0.5731, "step": 356 }, { "epoch": 0.07, "learning_rate": 1.4661190965092405e-05, "loss": 0.5699, "step": 357 }, { "epoch": 0.07, "learning_rate": 1.4702258726899386e-05, "loss": 0.6187, "step": 358 }, { "epoch": 0.07, "learning_rate": 1.4743326488706366e-05, "loss": 0.578, "step": 359 }, { "epoch": 0.07, "learning_rate": 1.4784394250513347e-05, "loss": 0.5836, "step": 360 }, { "epoch": 0.07, "learning_rate": 1.4825462012320331e-05, "loss": 0.5938, "step": 361 }, { "epoch": 0.07, "learning_rate": 1.4866529774127312e-05, "loss": 0.6304, "step": 362 }, { "epoch": 0.07, "learning_rate": 1.4907597535934293e-05, "loss": 0.5716, "step": 363 }, { "epoch": 0.07, "learning_rate": 1.4948665297741274e-05, "loss": 0.5952, "step": 364 }, { "epoch": 0.07, "learning_rate": 1.4989733059548254e-05, "loss": 0.5716, "step": 365 }, { "epoch": 0.07, "learning_rate": 1.5030800821355238e-05, "loss": 0.5722, "step": 366 }, { "epoch": 0.07, "learning_rate": 1.507186858316222e-05, "loss": 0.598, "step": 367 }, { "epoch": 0.07, "learning_rate": 1.51129363449692e-05, "loss": 0.5661, "step": 368 }, { "epoch": 0.07, "learning_rate": 1.515400410677618e-05, "loss": 0.5907, "step": 369 }, { "epoch": 0.07, "learning_rate": 1.5195071868583165e-05, "loss": 0.5948, "step": 370 }, { "epoch": 0.07, "learning_rate": 1.5236139630390146e-05, "loss": 0.5596, "step": 371 }, { "epoch": 0.07, "learning_rate": 1.5277207392197128e-05, "loss": 0.5797, "step": 372 }, { "epoch": 0.07, "learning_rate": 1.531827515400411e-05, "loss": 0.5861, "step": 373 }, { "epoch": 0.07, "learning_rate": 1.535934291581109e-05, "loss": 0.5752, "step": 374 }, { "epoch": 0.07, "learning_rate": 1.540041067761807e-05, "loss": 0.5743, "step": 375 }, { "epoch": 0.07, "learning_rate": 1.5441478439425054e-05, "loss": 0.5729, "step": 376 }, { "epoch": 0.07, "learning_rate": 1.5482546201232035e-05, "loss": 0.5766, "step": 377 }, { "epoch": 0.07, "learning_rate": 1.5523613963039016e-05, "loss": 0.5753, "step": 378 }, { "epoch": 0.07, "learning_rate": 1.5564681724845997e-05, "loss": 0.5692, "step": 379 }, { "epoch": 0.07, "learning_rate": 1.560574948665298e-05, "loss": 0.5982, "step": 380 }, { "epoch": 0.07, "learning_rate": 1.564681724845996e-05, "loss": 0.5923, "step": 381 }, { "epoch": 0.07, "learning_rate": 1.5687885010266942e-05, "loss": 0.5809, "step": 382 }, { "epoch": 0.07, "learning_rate": 1.5728952772073923e-05, "loss": 0.5891, "step": 383 }, { "epoch": 0.07, "learning_rate": 1.5770020533880904e-05, "loss": 0.5829, "step": 384 }, { "epoch": 0.07, "learning_rate": 1.5811088295687888e-05, "loss": 0.5825, "step": 385 }, { "epoch": 0.07, "learning_rate": 1.585215605749487e-05, "loss": 0.5625, "step": 386 }, { "epoch": 0.07, "learning_rate": 1.589322381930185e-05, "loss": 0.5788, "step": 387 }, { "epoch": 0.07, "learning_rate": 1.593429158110883e-05, "loss": 0.5794, "step": 388 }, { "epoch": 0.07, "learning_rate": 1.5975359342915814e-05, "loss": 0.5849, "step": 389 }, { "epoch": 0.07, "learning_rate": 1.6016427104722795e-05, "loss": 0.5848, "step": 390 }, { "epoch": 0.07, "learning_rate": 1.6057494866529776e-05, "loss": 0.5743, "step": 391 }, { "epoch": 0.07, "learning_rate": 1.6098562628336756e-05, "loss": 0.5421, "step": 392 }, { "epoch": 0.07, "learning_rate": 1.613963039014374e-05, "loss": 0.5924, "step": 393 }, { "epoch": 0.07, "learning_rate": 1.618069815195072e-05, "loss": 0.5791, "step": 394 }, { "epoch": 0.07, "learning_rate": 1.6221765913757702e-05, "loss": 0.5656, "step": 395 }, { "epoch": 0.07, "learning_rate": 1.6262833675564683e-05, "loss": 0.5914, "step": 396 }, { "epoch": 0.07, "learning_rate": 1.6303901437371667e-05, "loss": 0.5714, "step": 397 }, { "epoch": 0.07, "learning_rate": 1.6344969199178648e-05, "loss": 0.5465, "step": 398 }, { "epoch": 0.07, "learning_rate": 1.638603696098563e-05, "loss": 0.5776, "step": 399 }, { "epoch": 0.07, "learning_rate": 1.642710472279261e-05, "loss": 0.5769, "step": 400 }, { "epoch": 0.07, "learning_rate": 1.6468172484599593e-05, "loss": 0.595, "step": 401 }, { "epoch": 0.07, "learning_rate": 1.6509240246406574e-05, "loss": 0.5777, "step": 402 }, { "epoch": 0.07, "learning_rate": 1.6550308008213555e-05, "loss": 0.5801, "step": 403 }, { "epoch": 0.07, "learning_rate": 1.6591375770020536e-05, "loss": 0.586, "step": 404 }, { "epoch": 0.07, "learning_rate": 1.6632443531827516e-05, "loss": 0.5651, "step": 405 }, { "epoch": 0.08, "learning_rate": 1.66735112936345e-05, "loss": 0.5637, "step": 406 }, { "epoch": 0.08, "learning_rate": 1.671457905544148e-05, "loss": 0.587, "step": 407 }, { "epoch": 0.08, "learning_rate": 1.6755646817248462e-05, "loss": 0.6006, "step": 408 }, { "epoch": 0.08, "learning_rate": 1.6796714579055443e-05, "loss": 0.5531, "step": 409 }, { "epoch": 0.08, "learning_rate": 1.6837782340862427e-05, "loss": 0.587, "step": 410 }, { "epoch": 0.08, "learning_rate": 1.6878850102669408e-05, "loss": 0.5817, "step": 411 }, { "epoch": 0.08, "learning_rate": 1.6919917864476388e-05, "loss": 0.5755, "step": 412 }, { "epoch": 0.08, "learning_rate": 1.696098562628337e-05, "loss": 0.5754, "step": 413 }, { "epoch": 0.08, "learning_rate": 1.7002053388090353e-05, "loss": 0.5731, "step": 414 }, { "epoch": 0.08, "learning_rate": 1.7043121149897334e-05, "loss": 0.5803, "step": 415 }, { "epoch": 0.08, "learning_rate": 1.7084188911704315e-05, "loss": 0.5536, "step": 416 }, { "epoch": 0.08, "learning_rate": 1.7125256673511295e-05, "loss": 0.5927, "step": 417 }, { "epoch": 0.08, "learning_rate": 1.7166324435318276e-05, "loss": 0.5764, "step": 418 }, { "epoch": 0.08, "learning_rate": 1.720739219712526e-05, "loss": 0.5852, "step": 419 }, { "epoch": 0.08, "learning_rate": 1.724845995893224e-05, "loss": 0.6041, "step": 420 }, { "epoch": 0.08, "learning_rate": 1.7289527720739222e-05, "loss": 0.5864, "step": 421 }, { "epoch": 0.08, "learning_rate": 1.7330595482546202e-05, "loss": 0.5629, "step": 422 }, { "epoch": 0.08, "learning_rate": 1.7371663244353187e-05, "loss": 0.5748, "step": 423 }, { "epoch": 0.08, "learning_rate": 1.7412731006160167e-05, "loss": 0.5765, "step": 424 }, { "epoch": 0.08, "learning_rate": 1.7453798767967148e-05, "loss": 0.5663, "step": 425 }, { "epoch": 0.08, "learning_rate": 1.749486652977413e-05, "loss": 0.5737, "step": 426 }, { "epoch": 0.08, "learning_rate": 1.753593429158111e-05, "loss": 0.5734, "step": 427 }, { "epoch": 0.08, "learning_rate": 1.7577002053388094e-05, "loss": 0.5766, "step": 428 }, { "epoch": 0.08, "learning_rate": 1.7618069815195074e-05, "loss": 0.5807, "step": 429 }, { "epoch": 0.08, "learning_rate": 1.7659137577002055e-05, "loss": 0.6036, "step": 430 }, { "epoch": 0.08, "learning_rate": 1.7700205338809036e-05, "loss": 0.563, "step": 431 }, { "epoch": 0.08, "learning_rate": 1.774127310061602e-05, "loss": 0.5931, "step": 432 }, { "epoch": 0.08, "learning_rate": 1.7782340862423e-05, "loss": 0.5767, "step": 433 }, { "epoch": 0.08, "learning_rate": 1.782340862422998e-05, "loss": 0.5937, "step": 434 }, { "epoch": 0.08, "learning_rate": 1.7864476386036962e-05, "loss": 0.5873, "step": 435 }, { "epoch": 0.08, "learning_rate": 1.7905544147843943e-05, "loss": 0.5719, "step": 436 }, { "epoch": 0.08, "learning_rate": 1.7946611909650927e-05, "loss": 0.5796, "step": 437 }, { "epoch": 0.08, "learning_rate": 1.7987679671457908e-05, "loss": 0.5834, "step": 438 }, { "epoch": 0.08, "learning_rate": 1.802874743326489e-05, "loss": 0.5861, "step": 439 }, { "epoch": 0.08, "learning_rate": 1.806981519507187e-05, "loss": 0.5848, "step": 440 }, { "epoch": 0.08, "learning_rate": 1.8110882956878854e-05, "loss": 0.5399, "step": 441 }, { "epoch": 0.08, "learning_rate": 1.8151950718685834e-05, "loss": 0.5608, "step": 442 }, { "epoch": 0.08, "learning_rate": 1.8193018480492815e-05, "loss": 0.5603, "step": 443 }, { "epoch": 0.08, "learning_rate": 1.8234086242299796e-05, "loss": 0.5767, "step": 444 }, { "epoch": 0.08, "learning_rate": 1.827515400410678e-05, "loss": 0.5745, "step": 445 }, { "epoch": 0.08, "learning_rate": 1.831622176591376e-05, "loss": 0.5675, "step": 446 }, { "epoch": 0.08, "learning_rate": 1.835728952772074e-05, "loss": 0.5839, "step": 447 }, { "epoch": 0.08, "learning_rate": 1.8398357289527722e-05, "loss": 0.5896, "step": 448 }, { "epoch": 0.08, "learning_rate": 1.8439425051334703e-05, "loss": 0.5734, "step": 449 }, { "epoch": 0.08, "learning_rate": 1.8480492813141687e-05, "loss": 0.5605, "step": 450 }, { "epoch": 0.08, "learning_rate": 1.8521560574948668e-05, "loss": 0.5655, "step": 451 }, { "epoch": 0.08, "learning_rate": 1.856262833675565e-05, "loss": 0.5715, "step": 452 }, { "epoch": 0.08, "learning_rate": 1.860369609856263e-05, "loss": 0.5805, "step": 453 }, { "epoch": 0.08, "learning_rate": 1.8644763860369613e-05, "loss": 0.5615, "step": 454 }, { "epoch": 0.08, "learning_rate": 1.8685831622176594e-05, "loss": 0.5759, "step": 455 }, { "epoch": 0.08, "learning_rate": 1.8726899383983575e-05, "loss": 0.5779, "step": 456 }, { "epoch": 0.08, "learning_rate": 1.8767967145790556e-05, "loss": 0.5725, "step": 457 }, { "epoch": 0.08, "learning_rate": 1.8809034907597536e-05, "loss": 0.5765, "step": 458 }, { "epoch": 0.08, "learning_rate": 1.885010266940452e-05, "loss": 0.5623, "step": 459 }, { "epoch": 0.09, "learning_rate": 1.88911704312115e-05, "loss": 0.5572, "step": 460 }, { "epoch": 0.09, "learning_rate": 1.8932238193018482e-05, "loss": 0.5767, "step": 461 }, { "epoch": 0.09, "learning_rate": 1.8973305954825463e-05, "loss": 0.5711, "step": 462 }, { "epoch": 0.09, "learning_rate": 1.9014373716632447e-05, "loss": 0.5438, "step": 463 }, { "epoch": 0.09, "learning_rate": 1.9055441478439428e-05, "loss": 0.5662, "step": 464 }, { "epoch": 0.09, "learning_rate": 1.909650924024641e-05, "loss": 0.5679, "step": 465 }, { "epoch": 0.09, "learning_rate": 1.913757700205339e-05, "loss": 0.583, "step": 466 }, { "epoch": 0.09, "learning_rate": 1.917864476386037e-05, "loss": 0.5561, "step": 467 }, { "epoch": 0.09, "learning_rate": 1.9219712525667354e-05, "loss": 0.5622, "step": 468 }, { "epoch": 0.09, "learning_rate": 1.9260780287474335e-05, "loss": 0.56, "step": 469 }, { "epoch": 0.09, "learning_rate": 1.9301848049281315e-05, "loss": 0.5481, "step": 470 }, { "epoch": 0.09, "learning_rate": 1.9342915811088296e-05, "loss": 0.5825, "step": 471 }, { "epoch": 0.09, "learning_rate": 1.938398357289528e-05, "loss": 0.5728, "step": 472 }, { "epoch": 0.09, "learning_rate": 1.942505133470226e-05, "loss": 0.5668, "step": 473 }, { "epoch": 0.09, "learning_rate": 1.9466119096509242e-05, "loss": 0.5839, "step": 474 }, { "epoch": 0.09, "learning_rate": 1.9507186858316223e-05, "loss": 0.5619, "step": 475 }, { "epoch": 0.09, "learning_rate": 1.9548254620123207e-05, "loss": 0.574, "step": 476 }, { "epoch": 0.09, "learning_rate": 1.9589322381930187e-05, "loss": 0.5744, "step": 477 }, { "epoch": 0.09, "learning_rate": 1.9630390143737168e-05, "loss": 0.5523, "step": 478 }, { "epoch": 0.09, "learning_rate": 1.967145790554415e-05, "loss": 0.5781, "step": 479 }, { "epoch": 0.09, "learning_rate": 1.971252566735113e-05, "loss": 0.5615, "step": 480 }, { "epoch": 0.09, "learning_rate": 1.9753593429158114e-05, "loss": 0.5997, "step": 481 }, { "epoch": 0.09, "learning_rate": 1.9794661190965095e-05, "loss": 0.5598, "step": 482 }, { "epoch": 0.09, "learning_rate": 1.9835728952772075e-05, "loss": 0.5771, "step": 483 }, { "epoch": 0.09, "learning_rate": 1.9876796714579056e-05, "loss": 0.561, "step": 484 }, { "epoch": 0.09, "learning_rate": 1.991786447638604e-05, "loss": 0.5719, "step": 485 }, { "epoch": 0.09, "learning_rate": 1.995893223819302e-05, "loss": 0.5743, "step": 486 }, { "epoch": 0.09, "learning_rate": 2e-05, "loss": 0.55, "step": 487 }, { "epoch": 0.09, "learning_rate": 1.9999999800509258e-05, "loss": 0.5646, "step": 488 }, { "epoch": 0.09, "learning_rate": 1.999999920203704e-05, "loss": 0.5532, "step": 489 }, { "epoch": 0.09, "learning_rate": 1.9999998204583362e-05, "loss": 0.5668, "step": 490 }, { "epoch": 0.09, "learning_rate": 1.9999996808148278e-05, "loss": 0.566, "step": 491 }, { "epoch": 0.09, "learning_rate": 1.999999501273183e-05, "loss": 0.5526, "step": 492 }, { "epoch": 0.09, "learning_rate": 1.99999928183341e-05, "loss": 0.5706, "step": 493 }, { "epoch": 0.09, "learning_rate": 1.9999990224955167e-05, "loss": 0.5561, "step": 494 }, { "epoch": 0.09, "learning_rate": 1.9999987232595138e-05, "loss": 0.5605, "step": 495 }, { "epoch": 0.09, "learning_rate": 1.9999983841254135e-05, "loss": 0.5943, "step": 496 }, { "epoch": 0.09, "learning_rate": 1.999998005093229e-05, "loss": 0.5757, "step": 497 }, { "epoch": 0.09, "learning_rate": 1.999997586162976e-05, "loss": 0.5458, "step": 498 }, { "epoch": 0.09, "learning_rate": 1.9999971273346706e-05, "loss": 0.5648, "step": 499 }, { "epoch": 0.09, "learning_rate": 1.9999966286083306e-05, "loss": 0.5744, "step": 500 }, { "epoch": 0.09, "learning_rate": 1.9999960899839772e-05, "loss": 0.5947, "step": 501 }, { "epoch": 0.09, "learning_rate": 1.9999955114616313e-05, "loss": 0.564, "step": 502 }, { "epoch": 0.09, "learning_rate": 1.999994893041316e-05, "loss": 0.5719, "step": 503 }, { "epoch": 0.09, "learning_rate": 1.9999942347230555e-05, "loss": 0.5726, "step": 504 }, { "epoch": 0.09, "learning_rate": 1.9999935365068765e-05, "loss": 0.5687, "step": 505 }, { "epoch": 0.09, "learning_rate": 1.999992798392807e-05, "loss": 0.5778, "step": 506 }, { "epoch": 0.09, "learning_rate": 1.999992020380876e-05, "loss": 0.5812, "step": 507 }, { "epoch": 0.09, "learning_rate": 1.9999912024711154e-05, "loss": 0.5558, "step": 508 }, { "epoch": 0.09, "learning_rate": 1.999990344663557e-05, "loss": 0.5618, "step": 509 }, { "epoch": 0.09, "learning_rate": 1.999989446958235e-05, "loss": 0.5598, "step": 510 }, { "epoch": 0.09, "learning_rate": 1.9999885093551855e-05, "loss": 0.5573, "step": 511 }, { "epoch": 0.09, "learning_rate": 1.9999875318544463e-05, "loss": 0.5492, "step": 512 }, { "epoch": 0.09, "learning_rate": 1.9999865144560557e-05, "loss": 0.5632, "step": 513 }, { "epoch": 0.1, "learning_rate": 1.999985457160055e-05, "loss": 0.5768, "step": 514 }, { "epoch": 0.1, "learning_rate": 1.9999843599664855e-05, "loss": 0.561, "step": 515 }, { "epoch": 0.1, "learning_rate": 1.9999832228753914e-05, "loss": 0.5471, "step": 516 }, { "epoch": 0.1, "learning_rate": 1.9999820458868186e-05, "loss": 0.5616, "step": 517 }, { "epoch": 0.1, "learning_rate": 1.9999808290008133e-05, "loss": 0.5562, "step": 518 }, { "epoch": 0.1, "learning_rate": 1.9999795722174244e-05, "loss": 0.5779, "step": 519 }, { "epoch": 0.1, "learning_rate": 1.999978275536702e-05, "loss": 0.5849, "step": 520 }, { "epoch": 0.1, "learning_rate": 1.999976938958698e-05, "loss": 0.5737, "step": 521 }, { "epoch": 0.1, "learning_rate": 1.999975562483465e-05, "loss": 0.5512, "step": 522 }, { "epoch": 0.1, "learning_rate": 1.9999741461110587e-05, "loss": 0.5286, "step": 523 }, { "epoch": 0.1, "learning_rate": 1.9999726898415357e-05, "loss": 0.5795, "step": 524 }, { "epoch": 0.1, "learning_rate": 1.9999711936749536e-05, "loss": 0.5813, "step": 525 }, { "epoch": 0.1, "learning_rate": 1.999969657611372e-05, "loss": 0.5718, "step": 526 }, { "epoch": 0.1, "learning_rate": 1.999968081650853e-05, "loss": 0.5677, "step": 527 }, { "epoch": 0.1, "learning_rate": 1.9999664657934582e-05, "loss": 0.5846, "step": 528 }, { "epoch": 0.1, "learning_rate": 1.9999648100392536e-05, "loss": 0.5694, "step": 529 }, { "epoch": 0.1, "learning_rate": 1.999963114388304e-05, "loss": 0.5756, "step": 530 }, { "epoch": 0.1, "learning_rate": 1.9999613788406774e-05, "loss": 0.5664, "step": 531 }, { "epoch": 0.1, "learning_rate": 1.9999596033964435e-05, "loss": 0.5264, "step": 532 }, { "epoch": 0.1, "learning_rate": 1.9999577880556727e-05, "loss": 0.5553, "step": 533 }, { "epoch": 0.1, "learning_rate": 1.9999559328184374e-05, "loss": 0.5566, "step": 534 }, { "epoch": 0.1, "learning_rate": 1.999954037684812e-05, "loss": 0.555, "step": 535 }, { "epoch": 0.1, "learning_rate": 1.9999521026548718e-05, "loss": 0.5593, "step": 536 }, { "epoch": 0.1, "learning_rate": 1.999950127728694e-05, "loss": 0.5578, "step": 537 }, { "epoch": 0.1, "learning_rate": 1.999948112906357e-05, "loss": 0.5492, "step": 538 }, { "epoch": 0.1, "learning_rate": 1.999946058187942e-05, "loss": 0.5666, "step": 539 }, { "epoch": 0.1, "learning_rate": 1.999943963573531e-05, "loss": 0.5516, "step": 540 }, { "epoch": 0.1, "learning_rate": 1.9999418290632067e-05, "loss": 0.5716, "step": 541 }, { "epoch": 0.1, "learning_rate": 1.9999396546570553e-05, "loss": 0.5461, "step": 542 }, { "epoch": 0.1, "learning_rate": 1.9999374403551625e-05, "loss": 0.5667, "step": 543 }, { "epoch": 0.1, "learning_rate": 1.9999351861576174e-05, "loss": 0.5613, "step": 544 }, { "epoch": 0.1, "learning_rate": 1.9999328920645098e-05, "loss": 0.5478, "step": 545 }, { "epoch": 0.1, "learning_rate": 1.9999305580759308e-05, "loss": 0.5498, "step": 546 }, { "epoch": 0.1, "learning_rate": 1.999928184191974e-05, "loss": 0.5627, "step": 547 }, { "epoch": 0.1, "learning_rate": 1.999925770412734e-05, "loss": 0.5227, "step": 548 }, { "epoch": 0.1, "learning_rate": 1.9999233167383072e-05, "loss": 0.5584, "step": 549 }, { "epoch": 0.1, "learning_rate": 1.9999208231687914e-05, "loss": 0.5356, "step": 550 }, { "epoch": 0.1, "learning_rate": 1.9999182897042857e-05, "loss": 0.5768, "step": 551 }, { "epoch": 0.1, "learning_rate": 1.9999157163448918e-05, "loss": 0.5642, "step": 552 }, { "epoch": 0.1, "learning_rate": 1.9999131030907122e-05, "loss": 0.5559, "step": 553 }, { "epoch": 0.1, "learning_rate": 1.999910449941851e-05, "loss": 0.559, "step": 554 }, { "epoch": 0.1, "learning_rate": 1.999907756898414e-05, "loss": 0.5643, "step": 555 }, { "epoch": 0.1, "learning_rate": 1.9999050239605088e-05, "loss": 0.5559, "step": 556 }, { "epoch": 0.1, "learning_rate": 1.9999022511282446e-05, "loss": 0.5531, "step": 557 }, { "epoch": 0.1, "learning_rate": 1.9998994384017318e-05, "loss": 0.5449, "step": 558 }, { "epoch": 0.1, "learning_rate": 1.9998965857810825e-05, "loss": 0.5744, "step": 559 }, { "epoch": 0.1, "learning_rate": 1.9998936932664107e-05, "loss": 0.5433, "step": 560 }, { "epoch": 0.1, "learning_rate": 1.9998907608578317e-05, "loss": 0.5443, "step": 561 }, { "epoch": 0.1, "learning_rate": 1.999887788555463e-05, "loss": 0.5724, "step": 562 }, { "epoch": 0.1, "learning_rate": 1.9998847763594226e-05, "loss": 0.5483, "step": 563 }, { "epoch": 0.1, "learning_rate": 1.9998817242698306e-05, "loss": 0.5507, "step": 564 }, { "epoch": 0.1, "learning_rate": 1.9998786322868093e-05, "loss": 0.5467, "step": 565 }, { "epoch": 0.1, "learning_rate": 1.999875500410482e-05, "loss": 0.5366, "step": 566 }, { "epoch": 0.1, "learning_rate": 1.9998723286409732e-05, "loss": 0.5595, "step": 567 }, { "epoch": 0.11, "learning_rate": 1.9998691169784096e-05, "loss": 0.5562, "step": 568 }, { "epoch": 0.11, "learning_rate": 1.9998658654229194e-05, "loss": 0.5677, "step": 569 }, { "epoch": 0.11, "learning_rate": 1.9998625739746328e-05, "loss": 0.5599, "step": 570 }, { "epoch": 0.11, "learning_rate": 1.9998592426336802e-05, "loss": 0.5576, "step": 571 }, { "epoch": 0.11, "learning_rate": 1.999855871400195e-05, "loss": 0.5503, "step": 572 }, { "epoch": 0.11, "learning_rate": 1.999852460274312e-05, "loss": 0.5606, "step": 573 }, { "epoch": 0.11, "learning_rate": 1.9998490092561668e-05, "loss": 0.5565, "step": 574 }, { "epoch": 0.11, "learning_rate": 1.9998455183458976e-05, "loss": 0.5417, "step": 575 }, { "epoch": 0.11, "learning_rate": 1.9998419875436435e-05, "loss": 0.5498, "step": 576 }, { "epoch": 0.11, "learning_rate": 1.9998384168495447e-05, "loss": 0.5716, "step": 577 }, { "epoch": 0.11, "learning_rate": 1.999834806263745e-05, "loss": 0.5384, "step": 578 }, { "epoch": 0.11, "learning_rate": 1.9998311557863866e-05, "loss": 0.5849, "step": 579 }, { "epoch": 0.11, "learning_rate": 1.999827465417617e-05, "loss": 0.5644, "step": 580 }, { "epoch": 0.11, "learning_rate": 1.9998237351575823e-05, "loss": 0.5657, "step": 581 }, { "epoch": 0.11, "learning_rate": 1.9998199650064317e-05, "loss": 0.5465, "step": 582 }, { "epoch": 0.11, "learning_rate": 1.999816154964316e-05, "loss": 0.5337, "step": 583 }, { "epoch": 0.11, "learning_rate": 1.9998123050313866e-05, "loss": 0.5461, "step": 584 }, { "epoch": 0.11, "learning_rate": 1.9998084152077973e-05, "loss": 0.553, "step": 585 }, { "epoch": 0.11, "learning_rate": 1.9998044854937033e-05, "loss": 0.5373, "step": 586 }, { "epoch": 0.11, "learning_rate": 1.9998005158892614e-05, "loss": 0.5449, "step": 587 }, { "epoch": 0.11, "learning_rate": 1.9997965063946303e-05, "loss": 0.555, "step": 588 }, { "epoch": 0.11, "learning_rate": 1.9997924570099695e-05, "loss": 0.5451, "step": 589 }, { "epoch": 0.11, "learning_rate": 1.9997883677354407e-05, "loss": 0.5536, "step": 590 }, { "epoch": 0.11, "learning_rate": 1.999784238571207e-05, "loss": 0.5556, "step": 591 }, { "epoch": 0.11, "learning_rate": 1.9997800695174333e-05, "loss": 0.5514, "step": 592 }, { "epoch": 0.11, "learning_rate": 1.9997758605742858e-05, "loss": 0.5565, "step": 593 }, { "epoch": 0.11, "learning_rate": 1.9997716117419323e-05, "loss": 0.5686, "step": 594 }, { "epoch": 0.11, "learning_rate": 1.9997673230205428e-05, "loss": 0.5457, "step": 595 }, { "epoch": 0.11, "learning_rate": 1.999762994410288e-05, "loss": 0.5596, "step": 596 }, { "epoch": 0.11, "learning_rate": 1.999758625911341e-05, "loss": 0.5778, "step": 597 }, { "epoch": 0.11, "learning_rate": 1.9997542175238758e-05, "loss": 0.5544, "step": 598 }, { "epoch": 0.11, "learning_rate": 1.999749769248068e-05, "loss": 0.5412, "step": 599 }, { "epoch": 0.11, "learning_rate": 1.9997452810840956e-05, "loss": 0.559, "step": 600 }, { "epoch": 0.11, "learning_rate": 1.9997407530321377e-05, "loss": 0.5335, "step": 601 }, { "epoch": 0.11, "learning_rate": 1.9997361850923745e-05, "loss": 0.5389, "step": 602 }, { "epoch": 0.11, "learning_rate": 1.9997315772649882e-05, "loss": 0.5424, "step": 603 }, { "epoch": 0.11, "learning_rate": 1.999726929550163e-05, "loss": 0.5504, "step": 604 }, { "epoch": 0.11, "learning_rate": 1.9997222419480845e-05, "loss": 0.5703, "step": 605 }, { "epoch": 0.11, "learning_rate": 1.9997175144589395e-05, "loss": 0.5371, "step": 606 }, { "epoch": 0.11, "learning_rate": 1.9997127470829165e-05, "loss": 0.5444, "step": 607 }, { "epoch": 0.11, "learning_rate": 1.999707939820206e-05, "loss": 0.5698, "step": 608 }, { "epoch": 0.11, "learning_rate": 1.9997030926709993e-05, "loss": 0.5632, "step": 609 }, { "epoch": 0.11, "learning_rate": 1.99969820563549e-05, "loss": 0.5553, "step": 610 }, { "epoch": 0.11, "learning_rate": 1.9996932787138735e-05, "loss": 0.5402, "step": 611 }, { "epoch": 0.11, "learning_rate": 1.9996883119063462e-05, "loss": 0.5942, "step": 612 }, { "epoch": 0.11, "learning_rate": 1.9996833052131058e-05, "loss": 0.5635, "step": 613 }, { "epoch": 0.11, "learning_rate": 1.9996782586343527e-05, "loss": 0.554, "step": 614 }, { "epoch": 0.11, "learning_rate": 1.9996731721702875e-05, "loss": 0.538, "step": 615 }, { "epoch": 0.11, "learning_rate": 1.999668045821114e-05, "loss": 0.5629, "step": 616 }, { "epoch": 0.11, "learning_rate": 1.9996628795870362e-05, "loss": 0.5459, "step": 617 }, { "epoch": 0.11, "learning_rate": 1.99965767346826e-05, "loss": 0.563, "step": 618 }, { "epoch": 0.11, "learning_rate": 1.9996524274649935e-05, "loss": 0.5159, "step": 619 }, { "epoch": 0.11, "learning_rate": 1.9996471415774462e-05, "loss": 0.5513, "step": 620 }, { "epoch": 0.11, "learning_rate": 1.999641815805829e-05, "loss": 0.5578, "step": 621 }, { "epoch": 0.12, "learning_rate": 1.9996364501503538e-05, "loss": 0.5419, "step": 622 }, { "epoch": 0.12, "learning_rate": 1.999631044611235e-05, "loss": 0.5521, "step": 623 }, { "epoch": 0.12, "learning_rate": 1.999625599188688e-05, "loss": 0.5519, "step": 624 }, { "epoch": 0.12, "learning_rate": 1.999620113882931e-05, "loss": 0.5505, "step": 625 }, { "epoch": 0.12, "learning_rate": 1.999614588694182e-05, "loss": 0.5311, "step": 626 }, { "epoch": 0.12, "learning_rate": 1.9996090236226612e-05, "loss": 0.5404, "step": 627 }, { "epoch": 0.12, "learning_rate": 1.9996034186685915e-05, "loss": 0.5652, "step": 628 }, { "epoch": 0.12, "learning_rate": 1.999597773832196e-05, "loss": 0.5364, "step": 629 }, { "epoch": 0.12, "learning_rate": 1.9995920891137e-05, "loss": 0.5652, "step": 630 }, { "epoch": 0.12, "learning_rate": 1.9995863645133308e-05, "loss": 0.5317, "step": 631 }, { "epoch": 0.12, "learning_rate": 1.9995806000313157e-05, "loss": 0.5663, "step": 632 }, { "epoch": 0.12, "learning_rate": 1.9995747956678856e-05, "loss": 0.5482, "step": 633 }, { "epoch": 0.12, "learning_rate": 1.999568951423272e-05, "loss": 0.564, "step": 634 }, { "epoch": 0.12, "learning_rate": 1.9995630672977073e-05, "loss": 0.5453, "step": 635 }, { "epoch": 0.12, "learning_rate": 1.9995571432914273e-05, "loss": 0.5564, "step": 636 }, { "epoch": 0.12, "learning_rate": 1.999551179404668e-05, "loss": 0.5511, "step": 637 }, { "epoch": 0.12, "learning_rate": 1.9995451756376672e-05, "loss": 0.5511, "step": 638 }, { "epoch": 0.12, "learning_rate": 1.999539131990664e-05, "loss": 0.5497, "step": 639 }, { "epoch": 0.12, "learning_rate": 1.9995330484639005e-05, "loss": 0.5304, "step": 640 }, { "epoch": 0.12, "learning_rate": 1.999526925057619e-05, "loss": 0.5624, "step": 641 }, { "epoch": 0.12, "learning_rate": 1.9995207617720637e-05, "loss": 0.5605, "step": 642 }, { "epoch": 0.12, "learning_rate": 1.9995145586074806e-05, "loss": 0.5653, "step": 643 }, { "epoch": 0.12, "learning_rate": 1.999508315564117e-05, "loss": 0.5349, "step": 644 }, { "epoch": 0.12, "learning_rate": 1.9995020326422224e-05, "loss": 0.5349, "step": 645 }, { "epoch": 0.12, "learning_rate": 1.999495709842047e-05, "loss": 0.5317, "step": 646 }, { "epoch": 0.12, "learning_rate": 1.9994893471638433e-05, "loss": 0.5481, "step": 647 }, { "epoch": 0.12, "learning_rate": 1.9994829446078653e-05, "loss": 0.5518, "step": 648 }, { "epoch": 0.12, "learning_rate": 1.999476502174368e-05, "loss": 0.5452, "step": 649 }, { "epoch": 0.12, "learning_rate": 1.999470019863609e-05, "loss": 0.5393, "step": 650 }, { "epoch": 0.12, "learning_rate": 1.999463497675847e-05, "loss": 0.5435, "step": 651 }, { "epoch": 0.12, "learning_rate": 1.9994569356113412e-05, "loss": 0.5533, "step": 652 }, { "epoch": 0.12, "learning_rate": 1.9994503336703546e-05, "loss": 0.5301, "step": 653 }, { "epoch": 0.12, "learning_rate": 1.9994436918531498e-05, "loss": 0.5414, "step": 654 }, { "epoch": 0.12, "learning_rate": 1.9994370101599926e-05, "loss": 0.5728, "step": 655 }, { "epoch": 0.12, "learning_rate": 1.9994302885911487e-05, "loss": 0.5342, "step": 656 }, { "epoch": 0.12, "learning_rate": 1.9994235271468867e-05, "loss": 0.5389, "step": 657 }, { "epoch": 0.12, "learning_rate": 1.9994167258274764e-05, "loss": 0.5323, "step": 658 }, { "epoch": 0.12, "learning_rate": 1.9994098846331892e-05, "loss": 0.5492, "step": 659 }, { "epoch": 0.12, "learning_rate": 1.999403003564298e-05, "loss": 0.5369, "step": 660 }, { "epoch": 0.12, "learning_rate": 1.9993960826210773e-05, "loss": 0.5462, "step": 661 }, { "epoch": 0.12, "learning_rate": 1.9993891218038028e-05, "loss": 0.5469, "step": 662 }, { "epoch": 0.12, "learning_rate": 1.999382121112753e-05, "loss": 0.5318, "step": 663 }, { "epoch": 0.12, "learning_rate": 1.999375080548207e-05, "loss": 0.5453, "step": 664 }, { "epoch": 0.12, "learning_rate": 1.9993680001104453e-05, "loss": 0.5514, "step": 665 }, { "epoch": 0.12, "learning_rate": 1.9993608797997508e-05, "loss": 0.5238, "step": 666 }, { "epoch": 0.12, "learning_rate": 1.9993537196164078e-05, "loss": 0.5391, "step": 667 }, { "epoch": 0.12, "learning_rate": 1.999346519560701e-05, "loss": 0.5577, "step": 668 }, { "epoch": 0.12, "learning_rate": 1.9993392796329188e-05, "loss": 0.5636, "step": 669 }, { "epoch": 0.12, "learning_rate": 1.9993319998333495e-05, "loss": 0.5471, "step": 670 }, { "epoch": 0.12, "learning_rate": 1.9993246801622833e-05, "loss": 0.5549, "step": 671 }, { "epoch": 0.12, "learning_rate": 1.999317320620013e-05, "loss": 0.5315, "step": 672 }, { "epoch": 0.12, "learning_rate": 1.9993099212068316e-05, "loss": 0.5301, "step": 673 }, { "epoch": 0.12, "learning_rate": 1.9993024819230343e-05, "loss": 0.5099, "step": 674 }, { "epoch": 0.12, "learning_rate": 1.9992950027689185e-05, "loss": 0.5665, "step": 675 }, { "epoch": 0.13, "learning_rate": 1.999287483744782e-05, "loss": 0.5266, "step": 676 }, { "epoch": 0.13, "learning_rate": 1.999279924850925e-05, "loss": 0.5592, "step": 677 }, { "epoch": 0.13, "learning_rate": 1.9992723260876494e-05, "loss": 0.5536, "step": 678 }, { "epoch": 0.13, "learning_rate": 1.9992646874552578e-05, "loss": 0.5598, "step": 679 }, { "epoch": 0.13, "learning_rate": 1.9992570089540554e-05, "loss": 0.5558, "step": 680 }, { "epoch": 0.13, "learning_rate": 1.9992492905843485e-05, "loss": 0.5648, "step": 681 }, { "epoch": 0.13, "learning_rate": 1.9992415323464447e-05, "loss": 0.5487, "step": 682 }, { "epoch": 0.13, "learning_rate": 1.999233734240654e-05, "loss": 0.534, "step": 683 }, { "epoch": 0.13, "learning_rate": 1.9992258962672874e-05, "loss": 0.5434, "step": 684 }, { "epoch": 0.13, "learning_rate": 1.9992180184266573e-05, "loss": 0.5696, "step": 685 }, { "epoch": 0.13, "learning_rate": 1.9992101007190782e-05, "loss": 0.5613, "step": 686 }, { "epoch": 0.13, "learning_rate": 1.9992021431448665e-05, "loss": 0.5455, "step": 687 }, { "epoch": 0.13, "learning_rate": 1.9991941457043393e-05, "loss": 0.5256, "step": 688 }, { "epoch": 0.13, "learning_rate": 1.9991861083978154e-05, "loss": 0.5147, "step": 689 }, { "epoch": 0.13, "learning_rate": 1.9991780312256154e-05, "loss": 0.5508, "step": 690 }, { "epoch": 0.13, "learning_rate": 1.9991699141880622e-05, "loss": 0.5271, "step": 691 }, { "epoch": 0.13, "learning_rate": 1.9991617572854793e-05, "loss": 0.5234, "step": 692 }, { "epoch": 0.13, "learning_rate": 1.9991535605181923e-05, "loss": 0.5255, "step": 693 }, { "epoch": 0.13, "learning_rate": 1.9991453238865278e-05, "loss": 0.5333, "step": 694 }, { "epoch": 0.13, "learning_rate": 1.9991370473908152e-05, "loss": 0.5248, "step": 695 }, { "epoch": 0.13, "learning_rate": 1.999128731031384e-05, "loss": 0.5392, "step": 696 }, { "epoch": 0.13, "learning_rate": 1.9991203748085663e-05, "loss": 0.5625, "step": 697 }, { "epoch": 0.13, "learning_rate": 1.9991119787226957e-05, "loss": 0.5482, "step": 698 }, { "epoch": 0.13, "learning_rate": 1.9991035427741065e-05, "loss": 0.5251, "step": 699 }, { "epoch": 0.13, "learning_rate": 1.999095066963136e-05, "loss": 0.5679, "step": 700 }, { "epoch": 0.13, "learning_rate": 1.9990865512901224e-05, "loss": 0.5414, "step": 701 }, { "epoch": 0.13, "learning_rate": 1.9990779957554048e-05, "loss": 0.5374, "step": 702 }, { "epoch": 0.13, "learning_rate": 1.9990694003593248e-05, "loss": 0.5403, "step": 703 }, { "epoch": 0.13, "learning_rate": 1.9990607651022256e-05, "loss": 0.5318, "step": 704 }, { "epoch": 0.13, "learning_rate": 1.9990520899844516e-05, "loss": 0.5306, "step": 705 }, { "epoch": 0.13, "learning_rate": 1.999043375006349e-05, "loss": 0.5366, "step": 706 }, { "epoch": 0.13, "learning_rate": 1.999034620168265e-05, "loss": 0.5519, "step": 707 }, { "epoch": 0.13, "learning_rate": 1.99902582547055e-05, "loss": 0.5525, "step": 708 }, { "epoch": 0.13, "learning_rate": 1.999016990913554e-05, "loss": 0.5544, "step": 709 }, { "epoch": 0.13, "learning_rate": 1.999008116497629e-05, "loss": 0.5604, "step": 710 }, { "epoch": 0.13, "learning_rate": 1.9989992022231303e-05, "loss": 0.5421, "step": 711 }, { "epoch": 0.13, "learning_rate": 1.998990248090413e-05, "loss": 0.5031, "step": 712 }, { "epoch": 0.13, "learning_rate": 1.9989812540998347e-05, "loss": 0.5393, "step": 713 }, { "epoch": 0.13, "learning_rate": 1.9989722202517537e-05, "loss": 0.5416, "step": 714 }, { "epoch": 0.13, "learning_rate": 1.9989631465465303e-05, "loss": 0.5568, "step": 715 }, { "epoch": 0.13, "learning_rate": 1.998954032984527e-05, "loss": 0.5391, "step": 716 }, { "epoch": 0.13, "learning_rate": 1.9989448795661077e-05, "loss": 0.5594, "step": 717 }, { "epoch": 0.13, "learning_rate": 1.998935686291637e-05, "loss": 0.5488, "step": 718 }, { "epoch": 0.13, "learning_rate": 1.998926453161482e-05, "loss": 0.5447, "step": 719 }, { "epoch": 0.13, "learning_rate": 1.998917180176011e-05, "loss": 0.5525, "step": 720 }, { "epoch": 0.13, "learning_rate": 1.9989078673355937e-05, "loss": 0.5214, "step": 721 }, { "epoch": 0.13, "learning_rate": 1.998898514640602e-05, "loss": 0.5411, "step": 722 }, { "epoch": 0.13, "learning_rate": 1.998889122091409e-05, "loss": 0.5557, "step": 723 }, { "epoch": 0.13, "learning_rate": 1.9988796896883892e-05, "loss": 0.5508, "step": 724 }, { "epoch": 0.13, "learning_rate": 1.9988702174319194e-05, "loss": 0.56, "step": 725 }, { "epoch": 0.13, "learning_rate": 1.9988607053223776e-05, "loss": 0.5625, "step": 726 }, { "epoch": 0.13, "learning_rate": 1.9988511533601426e-05, "loss": 0.5651, "step": 727 }, { "epoch": 0.13, "learning_rate": 1.998841561545596e-05, "loss": 0.545, "step": 728 }, { "epoch": 0.13, "learning_rate": 1.9988319298791202e-05, "loss": 0.5401, "step": 729 }, { "epoch": 0.14, "learning_rate": 1.9988222583611e-05, "loss": 0.5336, "step": 730 }, { "epoch": 0.14, "learning_rate": 1.998812546991921e-05, "loss": 0.5638, "step": 731 }, { "epoch": 0.14, "learning_rate": 1.9988027957719702e-05, "loss": 0.5394, "step": 732 }, { "epoch": 0.14, "learning_rate": 1.9987930047016374e-05, "loss": 0.5162, "step": 733 }, { "epoch": 0.14, "learning_rate": 1.9987831737813128e-05, "loss": 0.5385, "step": 734 }, { "epoch": 0.14, "learning_rate": 1.998773303011389e-05, "loss": 0.5544, "step": 735 }, { "epoch": 0.14, "learning_rate": 1.9987633923922592e-05, "loss": 0.5485, "step": 736 }, { "epoch": 0.14, "learning_rate": 1.9987534419243197e-05, "loss": 0.563, "step": 737 }, { "epoch": 0.14, "learning_rate": 1.9987434516079666e-05, "loss": 0.5494, "step": 738 }, { "epoch": 0.14, "learning_rate": 1.998733421443599e-05, "loss": 0.533, "step": 739 }, { "epoch": 0.14, "learning_rate": 1.998723351431617e-05, "loss": 0.5226, "step": 740 }, { "epoch": 0.14, "learning_rate": 1.9987132415724222e-05, "loss": 0.5495, "step": 741 }, { "epoch": 0.14, "learning_rate": 1.9987030918664185e-05, "loss": 0.5339, "step": 742 }, { "epoch": 0.14, "learning_rate": 1.9986929023140103e-05, "loss": 0.5399, "step": 743 }, { "epoch": 0.14, "learning_rate": 1.9986826729156045e-05, "loss": 0.5244, "step": 744 }, { "epoch": 0.14, "learning_rate": 1.998672403671609e-05, "loss": 0.5386, "step": 745 }, { "epoch": 0.14, "learning_rate": 1.9986620945824332e-05, "loss": 0.5469, "step": 746 }, { "epoch": 0.14, "learning_rate": 1.9986517456484892e-05, "loss": 0.5351, "step": 747 }, { "epoch": 0.14, "learning_rate": 1.9986413568701893e-05, "loss": 0.5249, "step": 748 }, { "epoch": 0.14, "learning_rate": 1.9986309282479484e-05, "loss": 0.5198, "step": 749 }, { "epoch": 0.14, "learning_rate": 1.998620459782182e-05, "loss": 0.5312, "step": 750 }, { "epoch": 0.14, "learning_rate": 1.9986099514733085e-05, "loss": 0.5144, "step": 751 }, { "epoch": 0.14, "learning_rate": 1.998599403321747e-05, "loss": 0.546, "step": 752 }, { "epoch": 0.14, "learning_rate": 1.9985888153279175e-05, "loss": 0.5363, "step": 753 }, { "epoch": 0.14, "learning_rate": 1.9985781874922438e-05, "loss": 0.5333, "step": 754 }, { "epoch": 0.14, "learning_rate": 1.998567519815149e-05, "loss": 0.5183, "step": 755 }, { "epoch": 0.14, "learning_rate": 1.9985568122970586e-05, "loss": 0.5562, "step": 756 }, { "epoch": 0.14, "learning_rate": 1.9985460649384007e-05, "loss": 0.5414, "step": 757 }, { "epoch": 0.14, "learning_rate": 1.9985352777396033e-05, "loss": 0.5247, "step": 758 }, { "epoch": 0.14, "learning_rate": 1.998524450701097e-05, "loss": 0.5571, "step": 759 }, { "epoch": 0.14, "learning_rate": 1.9985135838233137e-05, "loss": 0.5515, "step": 760 }, { "epoch": 0.14, "learning_rate": 1.9985026771066876e-05, "loss": 0.5473, "step": 761 }, { "epoch": 0.14, "learning_rate": 1.9984917305516533e-05, "loss": 0.5321, "step": 762 }, { "epoch": 0.14, "learning_rate": 1.9984807441586473e-05, "loss": 0.5281, "step": 763 }, { "epoch": 0.14, "learning_rate": 1.9984697179281083e-05, "loss": 0.5183, "step": 764 }, { "epoch": 0.14, "learning_rate": 1.998458651860476e-05, "loss": 0.529, "step": 765 }, { "epoch": 0.14, "learning_rate": 1.9984475459561927e-05, "loss": 0.5675, "step": 766 }, { "epoch": 0.14, "learning_rate": 1.9984364002157003e-05, "loss": 0.5235, "step": 767 }, { "epoch": 0.14, "learning_rate": 1.9984252146394442e-05, "loss": 0.5238, "step": 768 }, { "epoch": 0.14, "learning_rate": 1.9984139892278707e-05, "loss": 0.5474, "step": 769 }, { "epoch": 0.14, "learning_rate": 1.9984027239814273e-05, "loss": 0.5391, "step": 770 }, { "epoch": 0.14, "learning_rate": 1.998391418900564e-05, "loss": 0.5458, "step": 771 }, { "epoch": 0.14, "learning_rate": 1.9983800739857316e-05, "loss": 0.5266, "step": 772 }, { "epoch": 0.14, "learning_rate": 1.9983686892373826e-05, "loss": 0.5417, "step": 773 }, { "epoch": 0.14, "learning_rate": 1.998357264655971e-05, "loss": 0.5082, "step": 774 }, { "epoch": 0.14, "learning_rate": 1.9983458002419534e-05, "loss": 0.5276, "step": 775 }, { "epoch": 0.14, "learning_rate": 1.9983342959957866e-05, "loss": 0.5469, "step": 776 }, { "epoch": 0.14, "learning_rate": 1.9983227519179296e-05, "loss": 0.5417, "step": 777 }, { "epoch": 0.14, "learning_rate": 1.9983111680088434e-05, "loss": 0.5398, "step": 778 }, { "epoch": 0.14, "learning_rate": 1.99829954426899e-05, "loss": 0.5238, "step": 779 }, { "epoch": 0.14, "learning_rate": 1.9982878806988327e-05, "loss": 0.541, "step": 780 }, { "epoch": 0.14, "learning_rate": 1.9982761772988374e-05, "loss": 0.5278, "step": 781 }, { "epoch": 0.14, "learning_rate": 1.998264434069471e-05, "loss": 0.5395, "step": 782 }, { "epoch": 0.14, "learning_rate": 1.9982526510112018e-05, "loss": 0.5364, "step": 783 }, { "epoch": 0.15, "learning_rate": 1.9982408281245004e-05, "loss": 0.553, "step": 784 }, { "epoch": 0.15, "learning_rate": 1.9982289654098378e-05, "loss": 0.52, "step": 785 }, { "epoch": 0.15, "learning_rate": 1.9982170628676877e-05, "loss": 0.5482, "step": 786 }, { "epoch": 0.15, "learning_rate": 1.9982051204985245e-05, "loss": 0.552, "step": 787 }, { "epoch": 0.15, "learning_rate": 1.998193138302826e-05, "loss": 0.5272, "step": 788 }, { "epoch": 0.15, "learning_rate": 1.9981811162810685e-05, "loss": 0.5397, "step": 789 }, { "epoch": 0.15, "learning_rate": 1.9981690544337333e-05, "loss": 0.5575, "step": 790 }, { "epoch": 0.15, "learning_rate": 1.9981569527613005e-05, "loss": 0.5308, "step": 791 }, { "epoch": 0.15, "learning_rate": 1.9981448112642534e-05, "loss": 0.5164, "step": 792 }, { "epoch": 0.15, "learning_rate": 1.9981326299430764e-05, "loss": 0.519, "step": 793 }, { "epoch": 0.15, "learning_rate": 1.9981204087982554e-05, "loss": 0.5149, "step": 794 }, { "epoch": 0.15, "learning_rate": 1.998108147830278e-05, "loss": 0.5286, "step": 795 }, { "epoch": 0.15, "learning_rate": 1.9980958470396334e-05, "loss": 0.5505, "step": 796 }, { "epoch": 0.15, "learning_rate": 1.9980835064268126e-05, "loss": 0.5275, "step": 797 }, { "epoch": 0.15, "learning_rate": 1.9980711259923078e-05, "loss": 0.5313, "step": 798 }, { "epoch": 0.15, "learning_rate": 1.9980587057366127e-05, "loss": 0.5407, "step": 799 }, { "epoch": 0.15, "learning_rate": 1.9980462456602233e-05, "loss": 0.5432, "step": 800 }, { "epoch": 0.15, "learning_rate": 1.9980337457636367e-05, "loss": 0.5334, "step": 801 }, { "epoch": 0.15, "learning_rate": 1.9980212060473512e-05, "loss": 0.5414, "step": 802 }, { "epoch": 0.15, "learning_rate": 1.9980086265118674e-05, "loss": 0.5405, "step": 803 }, { "epoch": 0.15, "learning_rate": 1.997996007157687e-05, "loss": 0.5421, "step": 804 }, { "epoch": 0.15, "learning_rate": 1.997983347985314e-05, "loss": 0.5422, "step": 805 }, { "epoch": 0.15, "learning_rate": 1.997970648995253e-05, "loss": 0.5289, "step": 806 }, { "epoch": 0.15, "learning_rate": 1.997957910188011e-05, "loss": 0.5269, "step": 807 }, { "epoch": 0.15, "learning_rate": 1.997945131564096e-05, "loss": 0.5279, "step": 808 }, { "epoch": 0.15, "learning_rate": 1.9979323131240176e-05, "loss": 0.5051, "step": 809 }, { "epoch": 0.15, "learning_rate": 1.9979194548682875e-05, "loss": 0.5172, "step": 810 }, { "epoch": 0.15, "learning_rate": 1.997906556797419e-05, "loss": 0.5313, "step": 811 }, { "epoch": 0.15, "learning_rate": 1.9978936189119263e-05, "loss": 0.5228, "step": 812 }, { "epoch": 0.15, "learning_rate": 1.997880641212326e-05, "loss": 0.5476, "step": 813 }, { "epoch": 0.15, "learning_rate": 1.9978676236991355e-05, "loss": 0.5052, "step": 814 }, { "epoch": 0.15, "learning_rate": 1.9978545663728744e-05, "loss": 0.5317, "step": 815 }, { "epoch": 0.15, "learning_rate": 1.9978414692340635e-05, "loss": 0.4973, "step": 816 }, { "epoch": 0.15, "learning_rate": 1.9978283322832254e-05, "loss": 0.5446, "step": 817 }, { "epoch": 0.15, "learning_rate": 1.997815155520884e-05, "loss": 0.5147, "step": 818 }, { "epoch": 0.15, "learning_rate": 1.9978019389475655e-05, "loss": 0.5506, "step": 819 }, { "epoch": 0.15, "learning_rate": 1.997788682563797e-05, "loss": 0.5417, "step": 820 }, { "epoch": 0.15, "learning_rate": 1.9977753863701077e-05, "loss": 0.539, "step": 821 }, { "epoch": 0.15, "learning_rate": 1.9977620503670278e-05, "loss": 0.5297, "step": 822 }, { "epoch": 0.15, "learning_rate": 1.997748674555089e-05, "loss": 0.5312, "step": 823 }, { "epoch": 0.15, "learning_rate": 1.9977352589348257e-05, "loss": 0.5179, "step": 824 }, { "epoch": 0.15, "learning_rate": 1.9977218035067728e-05, "loss": 0.5081, "step": 825 }, { "epoch": 0.15, "learning_rate": 1.997708308271467e-05, "loss": 0.517, "step": 826 }, { "epoch": 0.15, "learning_rate": 1.997694773229447e-05, "loss": 0.5292, "step": 827 }, { "epoch": 0.15, "learning_rate": 1.9976811983812527e-05, "loss": 0.5295, "step": 828 }, { "epoch": 0.15, "learning_rate": 1.997667583727426e-05, "loss": 0.5405, "step": 829 }, { "epoch": 0.15, "learning_rate": 1.9976539292685097e-05, "loss": 0.5444, "step": 830 }, { "epoch": 0.15, "learning_rate": 1.9976402350050487e-05, "loss": 0.5224, "step": 831 }, { "epoch": 0.15, "learning_rate": 1.997626500937589e-05, "loss": 0.5255, "step": 832 }, { "epoch": 0.15, "learning_rate": 1.9976127270666794e-05, "loss": 0.5467, "step": 833 }, { "epoch": 0.15, "learning_rate": 1.9975989133928692e-05, "loss": 0.5436, "step": 834 }, { "epoch": 0.15, "learning_rate": 1.9975850599167088e-05, "loss": 0.53, "step": 835 }, { "epoch": 0.15, "learning_rate": 1.9975711666387517e-05, "loss": 0.5542, "step": 836 }, { "epoch": 0.15, "learning_rate": 1.9975572335595523e-05, "loss": 0.5558, "step": 837 }, { "epoch": 0.16, "learning_rate": 1.997543260679666e-05, "loss": 0.5305, "step": 838 }, { "epoch": 0.16, "learning_rate": 1.9975292479996505e-05, "loss": 0.5191, "step": 839 }, { "epoch": 0.16, "learning_rate": 1.9975151955200648e-05, "loss": 0.5373, "step": 840 }, { "epoch": 0.16, "learning_rate": 1.99750110324147e-05, "loss": 0.5408, "step": 841 }, { "epoch": 0.16, "learning_rate": 1.9974869711644274e-05, "loss": 0.5288, "step": 842 }, { "epoch": 0.16, "learning_rate": 1.997472799289502e-05, "loss": 0.5316, "step": 843 }, { "epoch": 0.16, "learning_rate": 1.9974585876172584e-05, "loss": 0.5406, "step": 844 }, { "epoch": 0.16, "learning_rate": 1.9974443361482637e-05, "loss": 0.4961, "step": 845 }, { "epoch": 0.16, "learning_rate": 1.9974300448830873e-05, "loss": 0.5207, "step": 846 }, { "epoch": 0.16, "learning_rate": 1.9974157138222985e-05, "loss": 0.5282, "step": 847 }, { "epoch": 0.16, "learning_rate": 1.997401342966469e-05, "loss": 0.5568, "step": 848 }, { "epoch": 0.16, "learning_rate": 1.997386932316173e-05, "loss": 0.537, "step": 849 }, { "epoch": 0.16, "learning_rate": 1.9973724818719852e-05, "loss": 0.5223, "step": 850 }, { "epoch": 0.16, "learning_rate": 1.9973579916344814e-05, "loss": 0.5431, "step": 851 }, { "epoch": 0.16, "learning_rate": 1.9973434616042408e-05, "loss": 0.5311, "step": 852 }, { "epoch": 0.16, "learning_rate": 1.9973288917818425e-05, "loss": 0.5461, "step": 853 }, { "epoch": 0.16, "learning_rate": 1.9973142821678678e-05, "loss": 0.5252, "step": 854 }, { "epoch": 0.16, "learning_rate": 1.9972996327628996e-05, "loss": 0.5364, "step": 855 }, { "epoch": 0.16, "learning_rate": 1.9972849435675225e-05, "loss": 0.5305, "step": 856 }, { "epoch": 0.16, "learning_rate": 1.997270214582323e-05, "loss": 0.5129, "step": 857 }, { "epoch": 0.16, "learning_rate": 1.9972554458078877e-05, "loss": 0.5193, "step": 858 }, { "epoch": 0.16, "learning_rate": 1.997240637244807e-05, "loss": 0.5316, "step": 859 }, { "epoch": 0.16, "learning_rate": 1.997225788893671e-05, "loss": 0.5408, "step": 860 }, { "epoch": 0.16, "learning_rate": 1.9972109007550725e-05, "loss": 0.5354, "step": 861 }, { "epoch": 0.16, "learning_rate": 1.997195972829605e-05, "loss": 0.5336, "step": 862 }, { "epoch": 0.16, "learning_rate": 1.9971810051178647e-05, "loss": 0.5423, "step": 863 }, { "epoch": 0.16, "learning_rate": 1.9971659976204488e-05, "loss": 0.5447, "step": 864 }, { "epoch": 0.16, "learning_rate": 1.9971509503379552e-05, "loss": 0.5542, "step": 865 }, { "epoch": 0.16, "learning_rate": 1.9971358632709856e-05, "loss": 0.4943, "step": 866 }, { "epoch": 0.16, "learning_rate": 1.9971207364201404e-05, "loss": 0.5551, "step": 867 }, { "epoch": 0.16, "learning_rate": 1.9971055697860243e-05, "loss": 0.5678, "step": 868 }, { "epoch": 0.16, "learning_rate": 1.9970903633692423e-05, "loss": 0.5265, "step": 869 }, { "epoch": 0.16, "learning_rate": 1.9970751171704005e-05, "loss": 0.5316, "step": 870 }, { "epoch": 0.16, "learning_rate": 1.9970598311901078e-05, "loss": 0.525, "step": 871 }, { "epoch": 0.16, "learning_rate": 1.9970445054289737e-05, "loss": 0.5065, "step": 872 }, { "epoch": 0.16, "learning_rate": 1.99702913988761e-05, "loss": 0.5179, "step": 873 }, { "epoch": 0.16, "learning_rate": 1.997013734566629e-05, "loss": 0.5348, "step": 874 }, { "epoch": 0.16, "learning_rate": 1.9969982894666463e-05, "loss": 0.5381, "step": 875 }, { "epoch": 0.16, "learning_rate": 1.996982804588278e-05, "loss": 0.5361, "step": 876 }, { "epoch": 0.16, "learning_rate": 1.9969672799321414e-05, "loss": 0.528, "step": 877 }, { "epoch": 0.16, "learning_rate": 1.9969517154988563e-05, "loss": 0.5151, "step": 878 }, { "epoch": 0.16, "learning_rate": 1.9969361112890433e-05, "loss": 0.5291, "step": 879 }, { "epoch": 0.16, "learning_rate": 1.9969204673033253e-05, "loss": 0.5312, "step": 880 }, { "epoch": 0.16, "learning_rate": 1.9969047835423266e-05, "loss": 0.5437, "step": 881 }, { "epoch": 0.16, "learning_rate": 1.9968890600066726e-05, "loss": 0.5421, "step": 882 }, { "epoch": 0.16, "learning_rate": 1.996873296696991e-05, "loss": 0.5237, "step": 883 }, { "epoch": 0.16, "learning_rate": 1.9968574936139102e-05, "loss": 0.5384, "step": 884 }, { "epoch": 0.16, "learning_rate": 1.996841650758061e-05, "loss": 0.5535, "step": 885 }, { "epoch": 0.16, "learning_rate": 1.996825768130076e-05, "loss": 0.5147, "step": 886 }, { "epoch": 0.16, "learning_rate": 1.9968098457305882e-05, "loss": 0.5423, "step": 887 }, { "epoch": 0.16, "learning_rate": 1.996793883560233e-05, "loss": 0.519, "step": 888 }, { "epoch": 0.16, "learning_rate": 1.9967778816196474e-05, "loss": 0.535, "step": 889 }, { "epoch": 0.16, "learning_rate": 1.99676183990947e-05, "loss": 0.5099, "step": 890 }, { "epoch": 0.16, "learning_rate": 1.9967457584303406e-05, "loss": 0.5544, "step": 891 }, { "epoch": 0.17, "learning_rate": 1.9967296371829005e-05, "loss": 0.5272, "step": 892 }, { "epoch": 0.17, "learning_rate": 1.9967134761677936e-05, "loss": 0.5209, "step": 893 }, { "epoch": 0.17, "learning_rate": 1.9966972753856644e-05, "loss": 0.5251, "step": 894 }, { "epoch": 0.17, "learning_rate": 1.996681034837159e-05, "loss": 0.5296, "step": 895 }, { "epoch": 0.17, "learning_rate": 1.9966647545229255e-05, "loss": 0.5087, "step": 896 }, { "epoch": 0.17, "learning_rate": 1.996648434443614e-05, "loss": 0.5334, "step": 897 }, { "epoch": 0.17, "learning_rate": 1.996632074599875e-05, "loss": 0.5369, "step": 898 }, { "epoch": 0.17, "learning_rate": 1.9966156749923617e-05, "loss": 0.545, "step": 899 }, { "epoch": 0.17, "learning_rate": 1.996599235621728e-05, "loss": 0.4941, "step": 900 }, { "epoch": 0.17, "learning_rate": 1.9965827564886298e-05, "loss": 0.5281, "step": 901 }, { "epoch": 0.17, "learning_rate": 1.9965662375937248e-05, "loss": 0.5165, "step": 902 }, { "epoch": 0.17, "learning_rate": 1.996549678937672e-05, "loss": 0.5285, "step": 903 }, { "epoch": 0.17, "learning_rate": 1.996533080521132e-05, "loss": 0.549, "step": 904 }, { "epoch": 0.17, "learning_rate": 1.9965164423447672e-05, "loss": 0.5117, "step": 905 }, { "epoch": 0.17, "learning_rate": 1.9964997644092413e-05, "loss": 0.5493, "step": 906 }, { "epoch": 0.17, "learning_rate": 1.99648304671522e-05, "loss": 0.5498, "step": 907 }, { "epoch": 0.17, "learning_rate": 1.9964662892633696e-05, "loss": 0.5358, "step": 908 }, { "epoch": 0.17, "learning_rate": 1.9964494920543598e-05, "loss": 0.513, "step": 909 }, { "epoch": 0.17, "learning_rate": 1.9964326550888598e-05, "loss": 0.5128, "step": 910 }, { "epoch": 0.17, "learning_rate": 1.9964157783675415e-05, "loss": 0.499, "step": 911 }, { "epoch": 0.17, "learning_rate": 1.9963988618910787e-05, "loss": 0.5631, "step": 912 }, { "epoch": 0.17, "learning_rate": 1.996381905660146e-05, "loss": 0.5368, "step": 913 }, { "epoch": 0.17, "learning_rate": 1.9963649096754202e-05, "loss": 0.5154, "step": 914 }, { "epoch": 0.17, "learning_rate": 1.9963478739375794e-05, "loss": 0.5116, "step": 915 }, { "epoch": 0.17, "learning_rate": 1.9963307984473026e-05, "loss": 0.5321, "step": 916 }, { "epoch": 0.17, "learning_rate": 1.996313683205272e-05, "loss": 0.5113, "step": 917 }, { "epoch": 0.17, "learning_rate": 1.9962965282121697e-05, "loss": 0.5336, "step": 918 }, { "epoch": 0.17, "learning_rate": 1.996279333468681e-05, "loss": 0.5563, "step": 919 }, { "epoch": 0.17, "learning_rate": 1.996262098975491e-05, "loss": 0.5503, "step": 920 }, { "epoch": 0.17, "learning_rate": 1.996244824733288e-05, "loss": 0.5135, "step": 921 }, { "epoch": 0.17, "learning_rate": 1.996227510742761e-05, "loss": 0.5249, "step": 922 }, { "epoch": 0.17, "learning_rate": 1.9962101570046007e-05, "loss": 0.5445, "step": 923 }, { "epoch": 0.17, "learning_rate": 1.9961927635194994e-05, "loss": 0.5301, "step": 924 }, { "epoch": 0.17, "learning_rate": 1.9961753302881517e-05, "loss": 0.5362, "step": 925 }, { "epoch": 0.17, "learning_rate": 1.9961578573112526e-05, "loss": 0.5341, "step": 926 }, { "epoch": 0.17, "learning_rate": 1.996140344589499e-05, "loss": 0.527, "step": 927 }, { "epoch": 0.17, "learning_rate": 1.99612279212359e-05, "loss": 0.496, "step": 928 }, { "epoch": 0.17, "learning_rate": 1.9961051999142264e-05, "loss": 0.5257, "step": 929 }, { "epoch": 0.17, "learning_rate": 1.996087567962109e-05, "loss": 0.5367, "step": 930 }, { "epoch": 0.17, "learning_rate": 1.9960698962679417e-05, "loss": 0.5088, "step": 931 }, { "epoch": 0.17, "learning_rate": 1.99605218483243e-05, "loss": 0.5535, "step": 932 }, { "epoch": 0.17, "learning_rate": 1.996034433656281e-05, "loss": 0.5193, "step": 933 }, { "epoch": 0.17, "learning_rate": 1.996016642740201e-05, "loss": 0.5078, "step": 934 }, { "epoch": 0.17, "learning_rate": 1.9959988120849015e-05, "loss": 0.5188, "step": 935 }, { "epoch": 0.17, "learning_rate": 1.9959809416910934e-05, "loss": 0.5472, "step": 936 }, { "epoch": 0.17, "learning_rate": 1.99596303155949e-05, "loss": 0.5126, "step": 937 }, { "epoch": 0.17, "learning_rate": 1.9959450816908052e-05, "loss": 0.5286, "step": 938 }, { "epoch": 0.17, "learning_rate": 1.9959270920857562e-05, "loss": 0.5124, "step": 939 }, { "epoch": 0.17, "learning_rate": 1.9959090627450595e-05, "loss": 0.5275, "step": 940 }, { "epoch": 0.17, "learning_rate": 1.9958909936694354e-05, "loss": 0.5033, "step": 941 }, { "epoch": 0.17, "learning_rate": 1.9958728848596044e-05, "loss": 0.5422, "step": 942 }, { "epoch": 0.17, "learning_rate": 1.995854736316289e-05, "loss": 0.5221, "step": 943 }, { "epoch": 0.17, "learning_rate": 1.9958365480402135e-05, "loss": 0.5404, "step": 944 }, { "epoch": 0.17, "learning_rate": 1.9958183200321034e-05, "loss": 0.5199, "step": 945 }, { "epoch": 0.18, "learning_rate": 1.995800052292686e-05, "loss": 0.5222, "step": 946 }, { "epoch": 0.18, "learning_rate": 1.9957817448226905e-05, "loss": 0.5302, "step": 947 }, { "epoch": 0.18, "learning_rate": 1.9957633976228467e-05, "loss": 0.52, "step": 948 }, { "epoch": 0.18, "learning_rate": 1.995745010693887e-05, "loss": 0.5184, "step": 949 }, { "epoch": 0.18, "learning_rate": 1.9957265840365453e-05, "loss": 0.5262, "step": 950 }, { "epoch": 0.18, "learning_rate": 1.995708117651556e-05, "loss": 0.5318, "step": 951 }, { "epoch": 0.18, "learning_rate": 1.9956896115396565e-05, "loss": 0.5338, "step": 952 }, { "epoch": 0.18, "learning_rate": 1.995671065701585e-05, "loss": 0.5382, "step": 953 }, { "epoch": 0.18, "learning_rate": 1.9956524801380812e-05, "loss": 0.5352, "step": 954 }, { "epoch": 0.18, "learning_rate": 1.995633854849887e-05, "loss": 0.5241, "step": 955 }, { "epoch": 0.18, "learning_rate": 1.9956151898377455e-05, "loss": 0.4892, "step": 956 }, { "epoch": 0.18, "learning_rate": 1.995596485102401e-05, "loss": 0.5134, "step": 957 }, { "epoch": 0.18, "learning_rate": 1.9955777406446002e-05, "loss": 0.533, "step": 958 }, { "epoch": 0.18, "learning_rate": 1.9955589564650908e-05, "loss": 0.5425, "step": 959 }, { "epoch": 0.18, "learning_rate": 1.9955401325646223e-05, "loss": 0.5076, "step": 960 }, { "epoch": 0.18, "learning_rate": 1.9955212689439457e-05, "loss": 0.5315, "step": 961 }, { "epoch": 0.18, "learning_rate": 1.995502365603813e-05, "loss": 0.5314, "step": 962 }, { "epoch": 0.18, "learning_rate": 1.99548342254498e-05, "loss": 0.5129, "step": 963 }, { "epoch": 0.18, "learning_rate": 1.995464439768201e-05, "loss": 0.517, "step": 964 }, { "epoch": 0.18, "learning_rate": 1.995445417274234e-05, "loss": 0.5341, "step": 965 }, { "epoch": 0.18, "learning_rate": 1.995426355063838e-05, "loss": 0.5286, "step": 966 }, { "epoch": 0.18, "learning_rate": 1.9954072531377733e-05, "loss": 0.5036, "step": 967 }, { "epoch": 0.18, "learning_rate": 1.9953881114968023e-05, "loss": 0.5165, "step": 968 }, { "epoch": 0.18, "learning_rate": 1.9953689301416883e-05, "loss": 0.5086, "step": 969 }, { "epoch": 0.18, "learning_rate": 1.9953497090731967e-05, "loss": 0.517, "step": 970 }, { "epoch": 0.18, "learning_rate": 1.9953304482920953e-05, "loss": 0.5336, "step": 971 }, { "epoch": 0.18, "learning_rate": 1.995311147799151e-05, "loss": 0.5215, "step": 972 }, { "epoch": 0.18, "learning_rate": 1.9952918075951353e-05, "loss": 0.5392, "step": 973 }, { "epoch": 0.18, "learning_rate": 1.9952724276808187e-05, "loss": 0.507, "step": 974 }, { "epoch": 0.18, "learning_rate": 1.995253008056975e-05, "loss": 0.5176, "step": 975 }, { "epoch": 0.18, "learning_rate": 1.995233548724379e-05, "loss": 0.5408, "step": 976 }, { "epoch": 0.18, "learning_rate": 1.9952140496838076e-05, "loss": 0.5546, "step": 977 }, { "epoch": 0.18, "learning_rate": 1.9951945109360377e-05, "loss": 0.531, "step": 978 }, { "epoch": 0.18, "learning_rate": 1.9951749324818492e-05, "loss": 0.5196, "step": 979 }, { "epoch": 0.18, "learning_rate": 1.9951553143220236e-05, "loss": 0.5167, "step": 980 }, { "epoch": 0.18, "learning_rate": 1.9951356564573436e-05, "loss": 0.5221, "step": 981 }, { "epoch": 0.18, "learning_rate": 1.9951159588885932e-05, "loss": 0.5149, "step": 982 }, { "epoch": 0.18, "learning_rate": 1.9950962216165585e-05, "loss": 0.5166, "step": 983 }, { "epoch": 0.18, "learning_rate": 1.995076444642027e-05, "loss": 0.5289, "step": 984 }, { "epoch": 0.18, "learning_rate": 1.9950566279657874e-05, "loss": 0.5163, "step": 985 }, { "epoch": 0.18, "learning_rate": 1.995036771588631e-05, "loss": 0.515, "step": 986 }, { "epoch": 0.18, "learning_rate": 1.9950168755113494e-05, "loss": 0.5379, "step": 987 }, { "epoch": 0.18, "learning_rate": 1.994996939734737e-05, "loss": 0.5321, "step": 988 }, { "epoch": 0.18, "learning_rate": 1.9949769642595886e-05, "loss": 0.5382, "step": 989 }, { "epoch": 0.18, "learning_rate": 1.9949569490867016e-05, "loss": 0.5347, "step": 990 }, { "epoch": 0.18, "learning_rate": 1.9949368942168745e-05, "loss": 0.5057, "step": 991 }, { "epoch": 0.18, "learning_rate": 1.9949167996509073e-05, "loss": 0.5111, "step": 992 }, { "epoch": 0.18, "learning_rate": 1.9948966653896017e-05, "loss": 0.5234, "step": 993 }, { "epoch": 0.18, "learning_rate": 1.9948764914337615e-05, "loss": 0.5062, "step": 994 }, { "epoch": 0.18, "learning_rate": 1.994856277784191e-05, "loss": 0.518, "step": 995 }, { "epoch": 0.18, "learning_rate": 1.994836024441697e-05, "loss": 0.5236, "step": 996 }, { "epoch": 0.18, "learning_rate": 1.9948157314070874e-05, "loss": 0.5058, "step": 997 }, { "epoch": 0.18, "learning_rate": 1.994795398681172e-05, "loss": 0.5452, "step": 998 }, { "epoch": 0.18, "learning_rate": 1.9947750262647623e-05, "loss": 0.5485, "step": 999 }, { "epoch": 0.19, "learning_rate": 1.9947546141586705e-05, "loss": 0.5292, "step": 1000 }, { "epoch": 0.19, "learning_rate": 1.9947341623637115e-05, "loss": 0.5359, "step": 1001 }, { "epoch": 0.19, "learning_rate": 1.994713670880701e-05, "loss": 0.5189, "step": 1002 }, { "epoch": 0.19, "learning_rate": 1.994693139710457e-05, "loss": 0.5502, "step": 1003 }, { "epoch": 0.19, "learning_rate": 1.994672568853798e-05, "loss": 0.5026, "step": 1004 }, { "epoch": 0.19, "learning_rate": 1.994651958311545e-05, "loss": 0.536, "step": 1005 }, { "epoch": 0.19, "learning_rate": 1.9946313080845207e-05, "loss": 0.5317, "step": 1006 }, { "epoch": 0.19, "learning_rate": 1.9946106181735488e-05, "loss": 0.5109, "step": 1007 }, { "epoch": 0.19, "learning_rate": 1.9945898885794547e-05, "loss": 0.515, "step": 1008 }, { "epoch": 0.19, "learning_rate": 1.9945691193030653e-05, "loss": 0.5263, "step": 1009 }, { "epoch": 0.19, "learning_rate": 1.9945483103452092e-05, "loss": 0.4991, "step": 1010 }, { "epoch": 0.19, "learning_rate": 1.994527461706717e-05, "loss": 0.5526, "step": 1011 }, { "epoch": 0.19, "learning_rate": 1.9945065733884207e-05, "loss": 0.5155, "step": 1012 }, { "epoch": 0.19, "learning_rate": 1.994485645391153e-05, "loss": 0.5413, "step": 1013 }, { "epoch": 0.19, "learning_rate": 1.9944646777157497e-05, "loss": 0.5293, "step": 1014 }, { "epoch": 0.19, "learning_rate": 1.994443670363047e-05, "loss": 0.5341, "step": 1015 }, { "epoch": 0.19, "learning_rate": 1.9944226233338826e-05, "loss": 0.5138, "step": 1016 }, { "epoch": 0.19, "learning_rate": 1.994401536629097e-05, "loss": 0.5131, "step": 1017 }, { "epoch": 0.19, "learning_rate": 1.994380410249531e-05, "loss": 0.5366, "step": 1018 }, { "epoch": 0.19, "learning_rate": 1.994359244196028e-05, "loss": 0.5044, "step": 1019 }, { "epoch": 0.19, "learning_rate": 1.9943380384694316e-05, "loss": 0.5272, "step": 1020 }, { "epoch": 0.19, "learning_rate": 1.9943167930705886e-05, "loss": 0.5174, "step": 1021 }, { "epoch": 0.19, "learning_rate": 1.9942955080003467e-05, "loss": 0.5317, "step": 1022 }, { "epoch": 0.19, "learning_rate": 1.9942741832595545e-05, "loss": 0.5297, "step": 1023 }, { "epoch": 0.19, "learning_rate": 1.994252818849064e-05, "loss": 0.5255, "step": 1024 }, { "epoch": 0.19, "learning_rate": 1.9942314147697263e-05, "loss": 0.5562, "step": 1025 }, { "epoch": 0.19, "learning_rate": 1.9942099710223957e-05, "loss": 0.5135, "step": 1026 }, { "epoch": 0.19, "learning_rate": 1.9941884876079285e-05, "loss": 0.5189, "step": 1027 }, { "epoch": 0.19, "learning_rate": 1.994166964527181e-05, "loss": 0.5101, "step": 1028 }, { "epoch": 0.19, "learning_rate": 1.9941454017810124e-05, "loss": 0.5156, "step": 1029 }, { "epoch": 0.19, "learning_rate": 1.994123799370283e-05, "loss": 0.518, "step": 1030 }, { "epoch": 0.19, "learning_rate": 1.9941021572958546e-05, "loss": 0.5206, "step": 1031 }, { "epoch": 0.19, "learning_rate": 1.9940804755585903e-05, "loss": 0.5383, "step": 1032 }, { "epoch": 0.19, "learning_rate": 1.994058754159356e-05, "loss": 0.5121, "step": 1033 }, { "epoch": 0.19, "learning_rate": 1.9940369930990174e-05, "loss": 0.5381, "step": 1034 }, { "epoch": 0.19, "learning_rate": 1.994015192378443e-05, "loss": 0.5108, "step": 1035 }, { "epoch": 0.19, "learning_rate": 1.9939933519985035e-05, "loss": 0.5258, "step": 1036 }, { "epoch": 0.19, "learning_rate": 1.9939714719600692e-05, "loss": 0.5158, "step": 1037 }, { "epoch": 0.19, "learning_rate": 1.9939495522640136e-05, "loss": 0.5058, "step": 1038 }, { "epoch": 0.19, "learning_rate": 1.993927592911211e-05, "loss": 0.5392, "step": 1039 }, { "epoch": 0.19, "learning_rate": 1.9939055939025378e-05, "loss": 0.5198, "step": 1040 }, { "epoch": 0.19, "learning_rate": 1.9938835552388713e-05, "loss": 0.5129, "step": 1041 }, { "epoch": 0.19, "learning_rate": 1.9938614769210912e-05, "loss": 0.5225, "step": 1042 }, { "epoch": 0.19, "learning_rate": 1.9938393589500782e-05, "loss": 0.5121, "step": 1043 }, { "epoch": 0.19, "learning_rate": 1.993817201326715e-05, "loss": 0.5292, "step": 1044 }, { "epoch": 0.19, "learning_rate": 1.9937950040518852e-05, "loss": 0.5262, "step": 1045 }, { "epoch": 0.19, "learning_rate": 1.993772767126475e-05, "loss": 0.5192, "step": 1046 }, { "epoch": 0.19, "learning_rate": 1.9937504905513712e-05, "loss": 0.508, "step": 1047 }, { "epoch": 0.19, "learning_rate": 1.9937281743274628e-05, "loss": 0.5179, "step": 1048 }, { "epoch": 0.19, "learning_rate": 1.9937058184556398e-05, "loss": 0.5205, "step": 1049 }, { "epoch": 0.19, "learning_rate": 1.9936834229367945e-05, "loss": 0.5426, "step": 1050 }, { "epoch": 0.19, "learning_rate": 1.9936609877718206e-05, "loss": 0.5127, "step": 1051 }, { "epoch": 0.19, "learning_rate": 1.993638512961613e-05, "loss": 0.5203, "step": 1052 }, { "epoch": 0.19, "learning_rate": 1.9936159985070683e-05, "loss": 0.5423, "step": 1053 }, { "epoch": 0.2, "learning_rate": 1.9935934444090846e-05, "loss": 0.5329, "step": 1054 }, { "epoch": 0.2, "learning_rate": 1.9935708506685624e-05, "loss": 0.4988, "step": 1055 }, { "epoch": 0.2, "learning_rate": 1.993548217286403e-05, "loss": 0.5039, "step": 1056 }, { "epoch": 0.2, "learning_rate": 1.9935255442635087e-05, "loss": 0.5266, "step": 1057 }, { "epoch": 0.2, "learning_rate": 1.993502831600785e-05, "loss": 0.5169, "step": 1058 }, { "epoch": 0.2, "learning_rate": 1.993480079299138e-05, "loss": 0.5215, "step": 1059 }, { "epoch": 0.2, "learning_rate": 1.9934572873594746e-05, "loss": 0.5265, "step": 1060 }, { "epoch": 0.2, "learning_rate": 1.9934344557827053e-05, "loss": 0.516, "step": 1061 }, { "epoch": 0.2, "learning_rate": 1.99341158456974e-05, "loss": 0.52, "step": 1062 }, { "epoch": 0.2, "learning_rate": 1.993388673721492e-05, "loss": 0.5066, "step": 1063 }, { "epoch": 0.2, "learning_rate": 1.9933657232388752e-05, "loss": 0.5166, "step": 1064 }, { "epoch": 0.2, "learning_rate": 1.993342733122805e-05, "loss": 0.5054, "step": 1065 }, { "epoch": 0.2, "learning_rate": 1.993319703374199e-05, "loss": 0.5078, "step": 1066 }, { "epoch": 0.2, "learning_rate": 1.993296633993976e-05, "loss": 0.5211, "step": 1067 }, { "epoch": 0.2, "learning_rate": 1.9932735249830564e-05, "loss": 0.4943, "step": 1068 }, { "epoch": 0.2, "learning_rate": 1.993250376342362e-05, "loss": 0.5125, "step": 1069 }, { "epoch": 0.2, "learning_rate": 1.9932271880728168e-05, "loss": 0.5393, "step": 1070 }, { "epoch": 0.2, "learning_rate": 1.993203960175345e-05, "loss": 0.5081, "step": 1071 }, { "epoch": 0.2, "learning_rate": 1.993180692650875e-05, "loss": 0.4947, "step": 1072 }, { "epoch": 0.2, "learning_rate": 1.9931573855003334e-05, "loss": 0.5131, "step": 1073 }, { "epoch": 0.2, "learning_rate": 1.9931340387246512e-05, "loss": 0.5174, "step": 1074 }, { "epoch": 0.2, "learning_rate": 1.9931106523247596e-05, "loss": 0.4968, "step": 1075 }, { "epoch": 0.2, "learning_rate": 1.9930872263015917e-05, "loss": 0.526, "step": 1076 }, { "epoch": 0.2, "learning_rate": 1.9930637606560822e-05, "loss": 0.5191, "step": 1077 }, { "epoch": 0.2, "learning_rate": 1.993040255389167e-05, "loss": 0.4968, "step": 1078 }, { "epoch": 0.2, "learning_rate": 1.9930167105017843e-05, "loss": 0.549, "step": 1079 }, { "epoch": 0.2, "learning_rate": 1.9929931259948735e-05, "loss": 0.5043, "step": 1080 }, { "epoch": 0.2, "learning_rate": 1.9929695018693752e-05, "loss": 0.5137, "step": 1081 }, { "epoch": 0.2, "learning_rate": 1.9929458381262324e-05, "loss": 0.5241, "step": 1082 }, { "epoch": 0.2, "learning_rate": 1.992922134766389e-05, "loss": 0.5151, "step": 1083 }, { "epoch": 0.2, "learning_rate": 1.992898391790791e-05, "loss": 0.5406, "step": 1084 }, { "epoch": 0.2, "learning_rate": 1.992874609200385e-05, "loss": 0.5169, "step": 1085 }, { "epoch": 0.2, "learning_rate": 1.9928507869961207e-05, "loss": 0.5421, "step": 1086 }, { "epoch": 0.2, "learning_rate": 1.9928269251789484e-05, "loss": 0.5145, "step": 1087 }, { "epoch": 0.2, "learning_rate": 1.9928030237498194e-05, "loss": 0.5126, "step": 1088 }, { "epoch": 0.2, "learning_rate": 1.9927790827096884e-05, "loss": 0.5085, "step": 1089 }, { "epoch": 0.2, "learning_rate": 1.9927551020595096e-05, "loss": 0.5223, "step": 1090 }, { "epoch": 0.2, "learning_rate": 1.9927310818002406e-05, "loss": 0.5387, "step": 1091 }, { "epoch": 0.2, "learning_rate": 1.9927070219328393e-05, "loss": 0.5047, "step": 1092 }, { "epoch": 0.2, "learning_rate": 1.9926829224582658e-05, "loss": 0.5225, "step": 1093 }, { "epoch": 0.2, "learning_rate": 1.9926587833774816e-05, "loss": 0.5006, "step": 1094 }, { "epoch": 0.2, "learning_rate": 1.9926346046914497e-05, "loss": 0.5281, "step": 1095 }, { "epoch": 0.2, "learning_rate": 1.992610386401135e-05, "loss": 0.509, "step": 1096 }, { "epoch": 0.2, "learning_rate": 1.9925861285075035e-05, "loss": 0.5047, "step": 1097 }, { "epoch": 0.2, "learning_rate": 1.9925618310115235e-05, "loss": 0.5324, "step": 1098 }, { "epoch": 0.2, "learning_rate": 1.992537493914164e-05, "loss": 0.5156, "step": 1099 }, { "epoch": 0.2, "learning_rate": 1.992513117216396e-05, "loss": 0.5406, "step": 1100 }, { "epoch": 0.2, "learning_rate": 1.9924887009191924e-05, "loss": 0.5301, "step": 1101 }, { "epoch": 0.2, "learning_rate": 1.992464245023527e-05, "loss": 0.4994, "step": 1102 }, { "epoch": 0.2, "learning_rate": 1.9924397495303756e-05, "loss": 0.5092, "step": 1103 }, { "epoch": 0.2, "learning_rate": 1.992415214440716e-05, "loss": 0.5421, "step": 1104 }, { "epoch": 0.2, "learning_rate": 1.9923906397555267e-05, "loss": 0.5024, "step": 1105 }, { "epoch": 0.2, "learning_rate": 1.992366025475788e-05, "loss": 0.5099, "step": 1106 }, { "epoch": 0.2, "learning_rate": 1.9923413716024823e-05, "loss": 0.5211, "step": 1107 }, { "epoch": 0.2, "learning_rate": 1.992316678136593e-05, "loss": 0.5083, "step": 1108 }, { "epoch": 0.21, "learning_rate": 1.9922919450791057e-05, "loss": 0.5437, "step": 1109 }, { "epoch": 0.21, "learning_rate": 1.992267172431007e-05, "loss": 0.5325, "step": 1110 }, { "epoch": 0.21, "learning_rate": 1.992242360193285e-05, "loss": 0.5131, "step": 1111 }, { "epoch": 0.21, "learning_rate": 1.9922175083669303e-05, "loss": 0.5236, "step": 1112 }, { "epoch": 0.21, "learning_rate": 1.992192616952934e-05, "loss": 0.5196, "step": 1113 }, { "epoch": 0.21, "learning_rate": 1.992167685952289e-05, "loss": 0.516, "step": 1114 }, { "epoch": 0.21, "learning_rate": 1.9921427153659904e-05, "loss": 0.4941, "step": 1115 }, { "epoch": 0.21, "learning_rate": 1.9921177051950345e-05, "loss": 0.5116, "step": 1116 }, { "epoch": 0.21, "learning_rate": 1.9920926554404188e-05, "loss": 0.5435, "step": 1117 }, { "epoch": 0.21, "learning_rate": 1.992067566103143e-05, "loss": 0.5149, "step": 1118 }, { "epoch": 0.21, "learning_rate": 1.9920424371842082e-05, "loss": 0.5173, "step": 1119 }, { "epoch": 0.21, "learning_rate": 1.9920172686846165e-05, "loss": 0.4984, "step": 1120 }, { "epoch": 0.21, "learning_rate": 1.9919920606053727e-05, "loss": 0.5265, "step": 1121 }, { "epoch": 0.21, "learning_rate": 1.9919668129474825e-05, "loss": 0.5048, "step": 1122 }, { "epoch": 0.21, "learning_rate": 1.991941525711953e-05, "loss": 0.5055, "step": 1123 }, { "epoch": 0.21, "learning_rate": 1.991916198899793e-05, "loss": 0.5428, "step": 1124 }, { "epoch": 0.21, "learning_rate": 1.991890832512013e-05, "loss": 0.5338, "step": 1125 }, { "epoch": 0.21, "learning_rate": 1.9918654265496257e-05, "loss": 0.5314, "step": 1126 }, { "epoch": 0.21, "learning_rate": 1.991839981013644e-05, "loss": 0.5109, "step": 1127 }, { "epoch": 0.21, "learning_rate": 1.991814495905083e-05, "loss": 0.5238, "step": 1128 }, { "epoch": 0.21, "learning_rate": 1.9917889712249606e-05, "loss": 0.5102, "step": 1129 }, { "epoch": 0.21, "learning_rate": 1.991763406974294e-05, "loss": 0.5339, "step": 1130 }, { "epoch": 0.21, "learning_rate": 1.991737803154104e-05, "loss": 0.5243, "step": 1131 }, { "epoch": 0.21, "learning_rate": 1.9917121597654115e-05, "loss": 0.516, "step": 1132 }, { "epoch": 0.21, "learning_rate": 1.99168647680924e-05, "loss": 0.5361, "step": 1133 }, { "epoch": 0.21, "learning_rate": 1.991660754286614e-05, "loss": 0.5044, "step": 1134 }, { "epoch": 0.21, "learning_rate": 1.9916349921985604e-05, "loss": 0.5283, "step": 1135 }, { "epoch": 0.21, "learning_rate": 1.9916091905461062e-05, "loss": 0.5217, "step": 1136 }, { "epoch": 0.21, "learning_rate": 1.9915833493302817e-05, "loss": 0.5211, "step": 1137 }, { "epoch": 0.21, "learning_rate": 1.9915574685521167e-05, "loss": 0.5458, "step": 1138 }, { "epoch": 0.21, "learning_rate": 1.991531548212645e-05, "loss": 0.543, "step": 1139 }, { "epoch": 0.21, "learning_rate": 1.9915055883129e-05, "loss": 0.5047, "step": 1140 }, { "epoch": 0.21, "learning_rate": 1.9914795888539182e-05, "loss": 0.5073, "step": 1141 }, { "epoch": 0.21, "learning_rate": 1.9914535498367362e-05, "loss": 0.5051, "step": 1142 }, { "epoch": 0.21, "learning_rate": 1.9914274712623932e-05, "loss": 0.5208, "step": 1143 }, { "epoch": 0.21, "learning_rate": 1.9914013531319297e-05, "loss": 0.5178, "step": 1144 }, { "epoch": 0.21, "learning_rate": 1.9913751954463876e-05, "loss": 0.5268, "step": 1145 }, { "epoch": 0.21, "learning_rate": 1.9913489982068107e-05, "loss": 0.5068, "step": 1146 }, { "epoch": 0.21, "learning_rate": 1.9913227614142446e-05, "loss": 0.5316, "step": 1147 }, { "epoch": 0.21, "learning_rate": 1.9912964850697353e-05, "loss": 0.5026, "step": 1148 }, { "epoch": 0.21, "learning_rate": 1.9912701691743317e-05, "loss": 0.5024, "step": 1149 }, { "epoch": 0.21, "learning_rate": 1.9912438137290834e-05, "loss": 0.5298, "step": 1150 }, { "epoch": 0.21, "learning_rate": 1.9912174187350424e-05, "loss": 0.521, "step": 1151 }, { "epoch": 0.21, "learning_rate": 1.9911909841932616e-05, "loss": 0.4998, "step": 1152 }, { "epoch": 0.21, "learning_rate": 1.9911645101047958e-05, "loss": 0.5029, "step": 1153 }, { "epoch": 0.21, "learning_rate": 1.991137996470701e-05, "loss": 0.4954, "step": 1154 }, { "epoch": 0.21, "learning_rate": 1.991111443292035e-05, "loss": 0.517, "step": 1155 }, { "epoch": 0.21, "learning_rate": 1.9910848505698575e-05, "loss": 0.531, "step": 1156 }, { "epoch": 0.21, "learning_rate": 1.9910582183052297e-05, "loss": 0.5303, "step": 1157 }, { "epoch": 0.21, "learning_rate": 1.9910315464992136e-05, "loss": 0.4985, "step": 1158 }, { "epoch": 0.21, "learning_rate": 1.9910048351528738e-05, "loss": 0.5194, "step": 1159 }, { "epoch": 0.21, "learning_rate": 1.9909780842672756e-05, "loss": 0.5187, "step": 1160 }, { "epoch": 0.21, "learning_rate": 1.990951293843487e-05, "loss": 0.5211, "step": 1161 }, { "epoch": 0.21, "learning_rate": 1.9909244638825763e-05, "loss": 0.506, "step": 1162 }, { "epoch": 0.22, "learning_rate": 1.990897594385614e-05, "loss": 0.5138, "step": 1163 }, { "epoch": 0.22, "learning_rate": 1.9908706853536725e-05, "loss": 0.5325, "step": 1164 }, { "epoch": 0.22, "learning_rate": 1.990843736787825e-05, "loss": 0.5137, "step": 1165 }, { "epoch": 0.22, "learning_rate": 1.990816748689147e-05, "loss": 0.5166, "step": 1166 }, { "epoch": 0.22, "learning_rate": 1.990789721058715e-05, "loss": 0.4916, "step": 1167 }, { "epoch": 0.22, "learning_rate": 1.9907626538976073e-05, "loss": 0.5165, "step": 1168 }, { "epoch": 0.22, "learning_rate": 1.9907355472069048e-05, "loss": 0.5104, "step": 1169 }, { "epoch": 0.22, "learning_rate": 1.990708400987688e-05, "loss": 0.5159, "step": 1170 }, { "epoch": 0.22, "learning_rate": 1.99068121524104e-05, "loss": 0.5004, "step": 1171 }, { "epoch": 0.22, "learning_rate": 1.990653989968046e-05, "loss": 0.5496, "step": 1172 }, { "epoch": 0.22, "learning_rate": 1.9906267251697916e-05, "loss": 0.5072, "step": 1173 }, { "epoch": 0.22, "learning_rate": 1.9905994208473652e-05, "loss": 0.4955, "step": 1174 }, { "epoch": 0.22, "learning_rate": 1.990572077001856e-05, "loss": 0.5092, "step": 1175 }, { "epoch": 0.22, "learning_rate": 1.990544693634355e-05, "loss": 0.5184, "step": 1176 }, { "epoch": 0.22, "learning_rate": 1.9905172707459543e-05, "loss": 0.5158, "step": 1177 }, { "epoch": 0.22, "learning_rate": 1.9904898083377486e-05, "loss": 0.5016, "step": 1178 }, { "epoch": 0.22, "learning_rate": 1.990462306410833e-05, "loss": 0.517, "step": 1179 }, { "epoch": 0.22, "learning_rate": 1.990434764966306e-05, "loss": 0.5029, "step": 1180 }, { "epoch": 0.22, "learning_rate": 1.9904071840052652e-05, "loss": 0.5055, "step": 1181 }, { "epoch": 0.22, "learning_rate": 1.990379563528811e-05, "loss": 0.5226, "step": 1182 }, { "epoch": 0.22, "learning_rate": 1.9903519035380467e-05, "loss": 0.5176, "step": 1183 }, { "epoch": 0.22, "learning_rate": 1.9903242040340745e-05, "loss": 0.5064, "step": 1184 }, { "epoch": 0.22, "learning_rate": 1.990296465018e-05, "loss": 0.5307, "step": 1185 }, { "epoch": 0.22, "learning_rate": 1.9902686864909303e-05, "loss": 0.5009, "step": 1186 }, { "epoch": 0.22, "learning_rate": 1.9902408684539732e-05, "loss": 0.5124, "step": 1187 }, { "epoch": 0.22, "learning_rate": 1.9902130109082393e-05, "loss": 0.5175, "step": 1188 }, { "epoch": 0.22, "learning_rate": 1.9901851138548392e-05, "loss": 0.5314, "step": 1189 }, { "epoch": 0.22, "learning_rate": 1.9901571772948864e-05, "loss": 0.4897, "step": 1190 }, { "epoch": 0.22, "learning_rate": 1.9901292012294954e-05, "loss": 0.5193, "step": 1191 }, { "epoch": 0.22, "learning_rate": 1.9901011856597828e-05, "loss": 0.5181, "step": 1192 }, { "epoch": 0.22, "learning_rate": 1.9900731305868658e-05, "loss": 0.5154, "step": 1193 }, { "epoch": 0.22, "learning_rate": 1.9900450360118636e-05, "loss": 0.4822, "step": 1194 }, { "epoch": 0.22, "learning_rate": 1.990016901935898e-05, "loss": 0.5384, "step": 1195 }, { "epoch": 0.22, "learning_rate": 1.989988728360091e-05, "loss": 0.491, "step": 1196 }, { "epoch": 0.22, "learning_rate": 1.9899605152855663e-05, "loss": 0.5177, "step": 1197 }, { "epoch": 0.22, "learning_rate": 1.9899322627134498e-05, "loss": 0.5009, "step": 1198 }, { "epoch": 0.22, "learning_rate": 1.9899039706448694e-05, "loss": 0.5079, "step": 1199 }, { "epoch": 0.22, "learning_rate": 1.989875639080953e-05, "loss": 0.5194, "step": 1200 }, { "epoch": 0.22, "learning_rate": 1.9898472680228314e-05, "loss": 0.5114, "step": 1201 }, { "epoch": 0.22, "learning_rate": 1.989818857471636e-05, "loss": 0.5008, "step": 1202 }, { "epoch": 0.22, "learning_rate": 1.9897904074285012e-05, "loss": 0.5134, "step": 1203 }, { "epoch": 0.22, "learning_rate": 1.9897619178945616e-05, "loss": 0.5076, "step": 1204 }, { "epoch": 0.22, "learning_rate": 1.989733388870954e-05, "loss": 0.53, "step": 1205 }, { "epoch": 0.22, "learning_rate": 1.9897048203588168e-05, "loss": 0.5024, "step": 1206 }, { "epoch": 0.22, "learning_rate": 1.9896762123592897e-05, "loss": 0.5442, "step": 1207 }, { "epoch": 0.22, "learning_rate": 1.9896475648735135e-05, "loss": 0.5241, "step": 1208 }, { "epoch": 0.22, "learning_rate": 1.9896188779026323e-05, "loss": 0.5158, "step": 1209 }, { "epoch": 0.22, "learning_rate": 1.9895901514477898e-05, "loss": 0.5201, "step": 1210 }, { "epoch": 0.22, "learning_rate": 1.9895613855101324e-05, "loss": 0.5154, "step": 1211 }, { "epoch": 0.22, "learning_rate": 1.989532580090808e-05, "loss": 0.5109, "step": 1212 }, { "epoch": 0.22, "learning_rate": 1.989503735190966e-05, "loss": 0.5181, "step": 1213 }, { "epoch": 0.22, "learning_rate": 1.9894748508117568e-05, "loss": 0.5219, "step": 1214 }, { "epoch": 0.22, "learning_rate": 1.9894459269543328e-05, "loss": 0.5108, "step": 1215 }, { "epoch": 0.22, "learning_rate": 1.9894169636198483e-05, "loss": 0.4936, "step": 1216 }, { "epoch": 0.23, "learning_rate": 1.9893879608094587e-05, "loss": 0.5101, "step": 1217 }, { "epoch": 0.23, "learning_rate": 1.9893589185243214e-05, "loss": 0.5467, "step": 1218 }, { "epoch": 0.23, "learning_rate": 1.989329836765595e-05, "loss": 0.4947, "step": 1219 }, { "epoch": 0.23, "learning_rate": 1.98930071553444e-05, "loss": 0.5122, "step": 1220 }, { "epoch": 0.23, "learning_rate": 1.989271554832018e-05, "loss": 0.5056, "step": 1221 }, { "epoch": 0.23, "learning_rate": 1.9892423546594924e-05, "loss": 0.5014, "step": 1222 }, { "epoch": 0.23, "learning_rate": 1.9892131150180284e-05, "loss": 0.5203, "step": 1223 }, { "epoch": 0.23, "learning_rate": 1.9891838359087928e-05, "loss": 0.504, "step": 1224 }, { "epoch": 0.23, "learning_rate": 1.9891545173329532e-05, "loss": 0.4943, "step": 1225 }, { "epoch": 0.23, "learning_rate": 1.98912515929168e-05, "loss": 0.5108, "step": 1226 }, { "epoch": 0.23, "learning_rate": 1.989095761786144e-05, "loss": 0.5244, "step": 1227 }, { "epoch": 0.23, "learning_rate": 1.9890663248175186e-05, "loss": 0.4939, "step": 1228 }, { "epoch": 0.23, "learning_rate": 1.989036848386978e-05, "loss": 0.5045, "step": 1229 }, { "epoch": 0.23, "learning_rate": 1.989007332495698e-05, "loss": 0.4968, "step": 1230 }, { "epoch": 0.23, "learning_rate": 1.9889777771448573e-05, "loss": 0.5151, "step": 1231 }, { "epoch": 0.23, "learning_rate": 1.9889481823356338e-05, "loss": 0.5164, "step": 1232 }, { "epoch": 0.23, "learning_rate": 1.9889185480692087e-05, "loss": 0.5028, "step": 1233 }, { "epoch": 0.23, "learning_rate": 1.9888888743467648e-05, "loss": 0.5263, "step": 1234 }, { "epoch": 0.23, "learning_rate": 1.9888591611694855e-05, "loss": 0.509, "step": 1235 }, { "epoch": 0.23, "learning_rate": 1.9888294085385567e-05, "loss": 0.506, "step": 1236 }, { "epoch": 0.23, "learning_rate": 1.988799616455165e-05, "loss": 0.495, "step": 1237 }, { "epoch": 0.23, "learning_rate": 1.9887697849204995e-05, "loss": 0.521, "step": 1238 }, { "epoch": 0.23, "learning_rate": 1.9887399139357502e-05, "loss": 0.513, "step": 1239 }, { "epoch": 0.23, "learning_rate": 1.9887100035021087e-05, "loss": 0.4944, "step": 1240 }, { "epoch": 0.23, "learning_rate": 1.988680053620769e-05, "loss": 0.5176, "step": 1241 }, { "epoch": 0.23, "learning_rate": 1.9886500642929252e-05, "loss": 0.5057, "step": 1242 }, { "epoch": 0.23, "learning_rate": 1.988620035519775e-05, "loss": 0.5027, "step": 1243 }, { "epoch": 0.23, "learning_rate": 1.9885899673025152e-05, "loss": 0.5058, "step": 1244 }, { "epoch": 0.23, "learning_rate": 1.988559859642346e-05, "loss": 0.5146, "step": 1245 }, { "epoch": 0.23, "learning_rate": 1.9885297125404687e-05, "loss": 0.51, "step": 1246 }, { "epoch": 0.23, "learning_rate": 1.9884995259980863e-05, "loss": 0.5076, "step": 1247 }, { "epoch": 0.23, "learning_rate": 1.9884693000164027e-05, "loss": 0.5092, "step": 1248 }, { "epoch": 0.23, "learning_rate": 1.9884390345966245e-05, "loss": 0.4918, "step": 1249 }, { "epoch": 0.23, "learning_rate": 1.9884087297399586e-05, "loss": 0.4948, "step": 1250 }, { "epoch": 0.23, "learning_rate": 1.9883783854476145e-05, "loss": 0.5237, "step": 1251 }, { "epoch": 0.23, "learning_rate": 1.9883480017208025e-05, "loss": 0.5023, "step": 1252 }, { "epoch": 0.23, "learning_rate": 1.9883175785607352e-05, "loss": 0.5066, "step": 1253 }, { "epoch": 0.23, "learning_rate": 1.9882871159686266e-05, "loss": 0.5011, "step": 1254 }, { "epoch": 0.23, "learning_rate": 1.9882566139456916e-05, "loss": 0.5143, "step": 1255 }, { "epoch": 0.23, "learning_rate": 1.9882260724931476e-05, "loss": 0.523, "step": 1256 }, { "epoch": 0.23, "learning_rate": 1.988195491612213e-05, "loss": 0.5138, "step": 1257 }, { "epoch": 0.23, "learning_rate": 1.9881648713041074e-05, "loss": 0.5046, "step": 1258 }, { "epoch": 0.23, "learning_rate": 1.9881342115700534e-05, "loss": 0.5132, "step": 1259 }, { "epoch": 0.23, "learning_rate": 1.9881035124112737e-05, "loss": 0.5006, "step": 1260 }, { "epoch": 0.23, "learning_rate": 1.9880727738289934e-05, "loss": 0.5322, "step": 1261 }, { "epoch": 0.23, "learning_rate": 1.9880419958244384e-05, "loss": 0.4828, "step": 1262 }, { "epoch": 0.23, "learning_rate": 1.9880111783988376e-05, "loss": 0.5006, "step": 1263 }, { "epoch": 0.23, "learning_rate": 1.98798032155342e-05, "loss": 0.5034, "step": 1264 }, { "epoch": 0.23, "learning_rate": 1.9879494252894163e-05, "loss": 0.5295, "step": 1265 }, { "epoch": 0.23, "learning_rate": 1.98791848960806e-05, "loss": 0.5167, "step": 1266 }, { "epoch": 0.23, "learning_rate": 1.987887514510585e-05, "loss": 0.5232, "step": 1267 }, { "epoch": 0.23, "learning_rate": 1.9878564999982274e-05, "loss": 0.5336, "step": 1268 }, { "epoch": 0.23, "learning_rate": 1.9878254460722243e-05, "loss": 0.4832, "step": 1269 }, { "epoch": 0.23, "learning_rate": 1.9877943527338145e-05, "loss": 0.5152, "step": 1270 }, { "epoch": 0.24, "learning_rate": 1.9877632199842393e-05, "loss": 0.4979, "step": 1271 }, { "epoch": 0.24, "learning_rate": 1.98773204782474e-05, "loss": 0.4977, "step": 1272 }, { "epoch": 0.24, "learning_rate": 1.9877008362565607e-05, "loss": 0.53, "step": 1273 }, { "epoch": 0.24, "learning_rate": 1.9876695852809473e-05, "loss": 0.5174, "step": 1274 }, { "epoch": 0.24, "learning_rate": 1.9876382948991458e-05, "loss": 0.4989, "step": 1275 }, { "epoch": 0.24, "learning_rate": 1.9876069651124048e-05, "loss": 0.4871, "step": 1276 }, { "epoch": 0.24, "learning_rate": 1.987575595921974e-05, "loss": 0.4976, "step": 1277 }, { "epoch": 0.24, "learning_rate": 1.9875441873291062e-05, "loss": 0.5189, "step": 1278 }, { "epoch": 0.24, "learning_rate": 1.9875127393350533e-05, "loss": 0.5049, "step": 1279 }, { "epoch": 0.24, "learning_rate": 1.9874812519410704e-05, "loss": 0.5215, "step": 1280 }, { "epoch": 0.24, "learning_rate": 1.9874497251484136e-05, "loss": 0.5225, "step": 1281 }, { "epoch": 0.24, "learning_rate": 1.9874181589583417e-05, "loss": 0.5289, "step": 1282 }, { "epoch": 0.24, "learning_rate": 1.987386553372113e-05, "loss": 0.497, "step": 1283 }, { "epoch": 0.24, "learning_rate": 1.9873549083909885e-05, "loss": 0.507, "step": 1284 }, { "epoch": 0.24, "learning_rate": 1.987323224016232e-05, "loss": 0.5455, "step": 1285 }, { "epoch": 0.24, "learning_rate": 1.987291500249106e-05, "loss": 0.5051, "step": 1286 }, { "epoch": 0.24, "learning_rate": 1.9872597370908777e-05, "loss": 0.5393, "step": 1287 }, { "epoch": 0.24, "learning_rate": 1.9872279345428132e-05, "loss": 0.5074, "step": 1288 }, { "epoch": 0.24, "learning_rate": 1.9871960926061825e-05, "loss": 0.4976, "step": 1289 }, { "epoch": 0.24, "learning_rate": 1.9871642112822552e-05, "loss": 0.5323, "step": 1290 }, { "epoch": 0.24, "learning_rate": 1.9871322905723038e-05, "loss": 0.512, "step": 1291 }, { "epoch": 0.24, "learning_rate": 1.9871003304776012e-05, "loss": 0.5223, "step": 1292 }, { "epoch": 0.24, "learning_rate": 1.987068330999423e-05, "loss": 0.5318, "step": 1293 }, { "epoch": 0.24, "learning_rate": 1.987036292139046e-05, "loss": 0.5233, "step": 1294 }, { "epoch": 0.24, "learning_rate": 1.9870042138977486e-05, "loss": 0.511, "step": 1295 }, { "epoch": 0.24, "learning_rate": 1.9869720962768106e-05, "loss": 0.4941, "step": 1296 }, { "epoch": 0.24, "learning_rate": 1.9869399392775128e-05, "loss": 0.5044, "step": 1297 }, { "epoch": 0.24, "learning_rate": 1.986907742901139e-05, "loss": 0.5101, "step": 1298 }, { "epoch": 0.24, "learning_rate": 1.9868755071489732e-05, "loss": 0.537, "step": 1299 }, { "epoch": 0.24, "learning_rate": 1.986843232022302e-05, "loss": 0.4892, "step": 1300 }, { "epoch": 0.24, "learning_rate": 1.986810917522413e-05, "loss": 0.5012, "step": 1301 }, { "epoch": 0.24, "learning_rate": 1.9867785636505953e-05, "loss": 0.5271, "step": 1302 }, { "epoch": 0.24, "learning_rate": 1.9867461704081398e-05, "loss": 0.5257, "step": 1303 }, { "epoch": 0.24, "learning_rate": 1.9867137377963394e-05, "loss": 0.5229, "step": 1304 }, { "epoch": 0.24, "learning_rate": 1.986681265816487e-05, "loss": 0.5149, "step": 1305 }, { "epoch": 0.24, "learning_rate": 1.9866487544698792e-05, "loss": 0.5353, "step": 1306 }, { "epoch": 0.24, "learning_rate": 1.986616203757813e-05, "loss": 0.4938, "step": 1307 }, { "epoch": 0.24, "learning_rate": 1.986583613681587e-05, "loss": 0.4951, "step": 1308 }, { "epoch": 0.24, "learning_rate": 1.9865509842425016e-05, "loss": 0.5039, "step": 1309 }, { "epoch": 0.24, "learning_rate": 1.9865183154418583e-05, "loss": 0.5097, "step": 1310 }, { "epoch": 0.24, "learning_rate": 1.9864856072809603e-05, "loss": 0.4981, "step": 1311 }, { "epoch": 0.24, "learning_rate": 1.9864528597611136e-05, "loss": 0.5207, "step": 1312 }, { "epoch": 0.24, "learning_rate": 1.9864200728836237e-05, "loss": 0.5182, "step": 1313 }, { "epoch": 0.24, "learning_rate": 1.9863872466497996e-05, "loss": 0.5154, "step": 1314 }, { "epoch": 0.24, "learning_rate": 1.98635438106095e-05, "loss": 0.5076, "step": 1315 }, { "epoch": 0.24, "learning_rate": 1.9863214761183873e-05, "loss": 0.4802, "step": 1316 }, { "epoch": 0.24, "learning_rate": 1.9862885318234237e-05, "loss": 0.5163, "step": 1317 }, { "epoch": 0.24, "learning_rate": 1.986255548177374e-05, "loss": 0.5037, "step": 1318 }, { "epoch": 0.24, "learning_rate": 1.9862225251815536e-05, "loss": 0.5027, "step": 1319 }, { "epoch": 0.24, "learning_rate": 1.9861894628372802e-05, "loss": 0.5359, "step": 1320 }, { "epoch": 0.24, "learning_rate": 1.9861563611458734e-05, "loss": 0.531, "step": 1321 }, { "epoch": 0.24, "learning_rate": 1.9861232201086536e-05, "loss": 0.4988, "step": 1322 }, { "epoch": 0.24, "learning_rate": 1.986090039726943e-05, "loss": 0.5099, "step": 1323 }, { "epoch": 0.24, "learning_rate": 1.9860568200020657e-05, "loss": 0.4848, "step": 1324 }, { "epoch": 0.25, "learning_rate": 1.9860235609353465e-05, "loss": 0.5157, "step": 1325 }, { "epoch": 0.25, "learning_rate": 1.9859902625281133e-05, "loss": 0.4848, "step": 1326 }, { "epoch": 0.25, "learning_rate": 1.9859569247816938e-05, "loss": 0.502, "step": 1327 }, { "epoch": 0.25, "learning_rate": 1.9859235476974187e-05, "loss": 0.5177, "step": 1328 }, { "epoch": 0.25, "learning_rate": 1.985890131276619e-05, "loss": 0.5278, "step": 1329 }, { "epoch": 0.25, "learning_rate": 1.985856675520629e-05, "loss": 0.5079, "step": 1330 }, { "epoch": 0.25, "learning_rate": 1.9858231804307823e-05, "loss": 0.4877, "step": 1331 }, { "epoch": 0.25, "learning_rate": 1.9857896460084164e-05, "loss": 0.5062, "step": 1332 }, { "epoch": 0.25, "learning_rate": 1.9857560722548684e-05, "loss": 0.5185, "step": 1333 }, { "epoch": 0.25, "learning_rate": 1.9857224591714787e-05, "loss": 0.5091, "step": 1334 }, { "epoch": 0.25, "learning_rate": 1.9856888067595875e-05, "loss": 0.5034, "step": 1335 }, { "epoch": 0.25, "learning_rate": 1.9856551150205377e-05, "loss": 0.499, "step": 1336 }, { "epoch": 0.25, "learning_rate": 1.985621383955674e-05, "loss": 0.5205, "step": 1337 }, { "epoch": 0.25, "learning_rate": 1.9855876135663418e-05, "loss": 0.4969, "step": 1338 }, { "epoch": 0.25, "learning_rate": 1.9855538038538888e-05, "loss": 0.4967, "step": 1339 }, { "epoch": 0.25, "learning_rate": 1.9855199548196637e-05, "loss": 0.5234, "step": 1340 }, { "epoch": 0.25, "learning_rate": 1.9854860664650165e-05, "loss": 0.5084, "step": 1341 }, { "epoch": 0.25, "learning_rate": 1.9854521387913004e-05, "loss": 0.4878, "step": 1342 }, { "epoch": 0.25, "learning_rate": 1.9854181717998684e-05, "loss": 0.5018, "step": 1343 }, { "epoch": 0.25, "learning_rate": 1.9853841654920757e-05, "loss": 0.4921, "step": 1344 }, { "epoch": 0.25, "learning_rate": 1.985350119869279e-05, "loss": 0.5188, "step": 1345 }, { "epoch": 0.25, "learning_rate": 1.985316034932837e-05, "loss": 0.508, "step": 1346 }, { "epoch": 0.25, "learning_rate": 1.9852819106841096e-05, "loss": 0.5172, "step": 1347 }, { "epoch": 0.25, "learning_rate": 1.9852477471244582e-05, "loss": 0.5057, "step": 1348 }, { "epoch": 0.25, "learning_rate": 1.9852135442552457e-05, "loss": 0.5317, "step": 1349 }, { "epoch": 0.25, "learning_rate": 1.9851793020778368e-05, "loss": 0.5106, "step": 1350 }, { "epoch": 0.25, "learning_rate": 1.9851450205935977e-05, "loss": 0.5187, "step": 1351 }, { "epoch": 0.25, "learning_rate": 1.9851106998038966e-05, "loss": 0.5252, "step": 1352 }, { "epoch": 0.25, "learning_rate": 1.9850763397101018e-05, "loss": 0.5105, "step": 1353 }, { "epoch": 0.25, "learning_rate": 1.9850419403135856e-05, "loss": 0.4958, "step": 1354 }, { "epoch": 0.25, "learning_rate": 1.9850075016157194e-05, "loss": 0.5116, "step": 1355 }, { "epoch": 0.25, "learning_rate": 1.9849730236178775e-05, "loss": 0.5196, "step": 1356 }, { "epoch": 0.25, "learning_rate": 1.9849385063214356e-05, "loss": 0.4936, "step": 1357 }, { "epoch": 0.25, "learning_rate": 1.9849039497277708e-05, "loss": 0.5134, "step": 1358 }, { "epoch": 0.25, "learning_rate": 1.984869353838262e-05, "loss": 0.5195, "step": 1359 }, { "epoch": 0.25, "learning_rate": 1.98483471865429e-05, "loss": 0.525, "step": 1360 }, { "epoch": 0.25, "learning_rate": 1.984800044177235e-05, "loss": 0.527, "step": 1361 }, { "epoch": 0.25, "learning_rate": 1.9847653304084822e-05, "loss": 0.5128, "step": 1362 }, { "epoch": 0.25, "learning_rate": 1.984730577349416e-05, "loss": 0.5, "step": 1363 }, { "epoch": 0.25, "learning_rate": 1.984695785001423e-05, "loss": 0.4977, "step": 1364 }, { "epoch": 0.25, "learning_rate": 1.9846609533658907e-05, "loss": 0.5319, "step": 1365 }, { "epoch": 0.25, "learning_rate": 1.9846260824442098e-05, "loss": 0.5174, "step": 1366 }, { "epoch": 0.25, "learning_rate": 1.9845911722377713e-05, "loss": 0.5034, "step": 1367 }, { "epoch": 0.25, "learning_rate": 1.9845562227479678e-05, "loss": 0.5126, "step": 1368 }, { "epoch": 0.25, "learning_rate": 1.984521233976194e-05, "loss": 0.5172, "step": 1369 }, { "epoch": 0.25, "learning_rate": 1.9844862059238455e-05, "loss": 0.4921, "step": 1370 }, { "epoch": 0.25, "learning_rate": 1.9844511385923203e-05, "loss": 0.5063, "step": 1371 }, { "epoch": 0.25, "learning_rate": 1.9844160319830177e-05, "loss": 0.5068, "step": 1372 }, { "epoch": 0.25, "learning_rate": 1.9843808860973375e-05, "loss": 0.4941, "step": 1373 }, { "epoch": 0.25, "learning_rate": 1.9843457009366825e-05, "loss": 0.5134, "step": 1374 }, { "epoch": 0.25, "learning_rate": 1.9843104765024567e-05, "loss": 0.5026, "step": 1375 }, { "epoch": 0.25, "learning_rate": 1.9842752127960652e-05, "loss": 0.5113, "step": 1376 }, { "epoch": 0.25, "learning_rate": 1.9842399098189152e-05, "loss": 0.4919, "step": 1377 }, { "epoch": 0.25, "learning_rate": 1.984204567572415e-05, "loss": 0.5046, "step": 1378 }, { "epoch": 0.26, "learning_rate": 1.9841691860579747e-05, "loss": 0.5174, "step": 1379 }, { "epoch": 0.26, "learning_rate": 1.9841337652770058e-05, "loss": 0.5141, "step": 1380 }, { "epoch": 0.26, "learning_rate": 1.984098305230922e-05, "loss": 0.5031, "step": 1381 }, { "epoch": 0.26, "learning_rate": 1.984062805921138e-05, "loss": 0.4972, "step": 1382 }, { "epoch": 0.26, "learning_rate": 1.9840272673490696e-05, "loss": 0.5027, "step": 1383 }, { "epoch": 0.26, "learning_rate": 1.9839916895161353e-05, "loss": 0.5134, "step": 1384 }, { "epoch": 0.26, "learning_rate": 1.9839560724237544e-05, "loss": 0.4995, "step": 1385 }, { "epoch": 0.26, "learning_rate": 1.983920416073348e-05, "loss": 0.5192, "step": 1386 }, { "epoch": 0.26, "learning_rate": 1.9838847204663386e-05, "loss": 0.4743, "step": 1387 }, { "epoch": 0.26, "learning_rate": 1.9838489856041505e-05, "loss": 0.53, "step": 1388 }, { "epoch": 0.26, "learning_rate": 1.9838132114882093e-05, "loss": 0.502, "step": 1389 }, { "epoch": 0.26, "learning_rate": 1.9837773981199423e-05, "loss": 0.5135, "step": 1390 }, { "epoch": 0.26, "learning_rate": 1.9837415455007792e-05, "loss": 0.5053, "step": 1391 }, { "epoch": 0.26, "learning_rate": 1.9837056536321492e-05, "loss": 0.5156, "step": 1392 }, { "epoch": 0.26, "learning_rate": 1.983669722515485e-05, "loss": 0.5119, "step": 1393 }, { "epoch": 0.26, "learning_rate": 1.9836337521522204e-05, "loss": 0.5178, "step": 1394 }, { "epoch": 0.26, "learning_rate": 1.98359774254379e-05, "loss": 0.5005, "step": 1395 }, { "epoch": 0.26, "learning_rate": 1.9835616936916303e-05, "loss": 0.4987, "step": 1396 }, { "epoch": 0.26, "learning_rate": 1.9835256055971808e-05, "loss": 0.5085, "step": 1397 }, { "epoch": 0.26, "learning_rate": 1.98348947826188e-05, "loss": 0.5287, "step": 1398 }, { "epoch": 0.26, "learning_rate": 1.9834533116871703e-05, "loss": 0.5039, "step": 1399 }, { "epoch": 0.26, "learning_rate": 1.983417105874494e-05, "loss": 0.4932, "step": 1400 }, { "epoch": 0.26, "learning_rate": 1.9833808608252965e-05, "loss": 0.4982, "step": 1401 }, { "epoch": 0.26, "learning_rate": 1.983344576541023e-05, "loss": 0.5272, "step": 1402 }, { "epoch": 0.26, "learning_rate": 1.9833082530231213e-05, "loss": 0.5155, "step": 1403 }, { "epoch": 0.26, "learning_rate": 1.983271890273041e-05, "loss": 0.4996, "step": 1404 }, { "epoch": 0.26, "learning_rate": 1.9832354882922327e-05, "loss": 0.5078, "step": 1405 }, { "epoch": 0.26, "learning_rate": 1.9831990470821487e-05, "loss": 0.4795, "step": 1406 }, { "epoch": 0.26, "learning_rate": 1.9831625666442433e-05, "loss": 0.5056, "step": 1407 }, { "epoch": 0.26, "learning_rate": 1.9831260469799714e-05, "loss": 0.5225, "step": 1408 }, { "epoch": 0.26, "learning_rate": 1.983089488090791e-05, "loss": 0.5171, "step": 1409 }, { "epoch": 0.26, "learning_rate": 1.9830528899781598e-05, "loss": 0.517, "step": 1410 }, { "epoch": 0.26, "learning_rate": 1.9830162526435383e-05, "loss": 0.4957, "step": 1411 }, { "epoch": 0.26, "learning_rate": 1.9829795760883887e-05, "loss": 0.4909, "step": 1412 }, { "epoch": 0.26, "learning_rate": 1.982942860314174e-05, "loss": 0.5418, "step": 1413 }, { "epoch": 0.26, "learning_rate": 1.9829061053223582e-05, "loss": 0.5185, "step": 1414 }, { "epoch": 0.26, "learning_rate": 1.9828693111144095e-05, "loss": 0.5008, "step": 1415 }, { "epoch": 0.26, "learning_rate": 1.9828324776917945e-05, "loss": 0.4909, "step": 1416 }, { "epoch": 0.26, "learning_rate": 1.9827956050559837e-05, "loss": 0.5165, "step": 1417 }, { "epoch": 0.26, "learning_rate": 1.9827586932084476e-05, "loss": 0.5061, "step": 1418 }, { "epoch": 0.26, "learning_rate": 1.9827217421506592e-05, "loss": 0.48, "step": 1419 }, { "epoch": 0.26, "learning_rate": 1.9826847518840928e-05, "loss": 0.5016, "step": 1420 }, { "epoch": 0.26, "learning_rate": 1.9826477224102242e-05, "loss": 0.4975, "step": 1421 }, { "epoch": 0.26, "learning_rate": 1.9826106537305307e-05, "loss": 0.4957, "step": 1422 }, { "epoch": 0.26, "learning_rate": 1.9825735458464915e-05, "loss": 0.5224, "step": 1423 }, { "epoch": 0.26, "learning_rate": 1.982536398759587e-05, "loss": 0.5047, "step": 1424 }, { "epoch": 0.26, "learning_rate": 1.9824992124712993e-05, "loss": 0.5027, "step": 1425 }, { "epoch": 0.26, "learning_rate": 1.982461986983112e-05, "loss": 0.4881, "step": 1426 }, { "epoch": 0.26, "learning_rate": 1.9824247222965104e-05, "loss": 0.5184, "step": 1427 }, { "epoch": 0.26, "learning_rate": 1.982387418412981e-05, "loss": 0.4926, "step": 1428 }, { "epoch": 0.26, "learning_rate": 1.982350075334013e-05, "loss": 0.4966, "step": 1429 }, { "epoch": 0.26, "learning_rate": 1.9823126930610956e-05, "loss": 0.5093, "step": 1430 }, { "epoch": 0.26, "learning_rate": 1.9822752715957202e-05, "loss": 0.4838, "step": 1431 }, { "epoch": 0.26, "learning_rate": 1.9822378109393802e-05, "loss": 0.5003, "step": 1432 }, { "epoch": 0.27, "learning_rate": 1.9822003110935704e-05, "loss": 0.4978, "step": 1433 }, { "epoch": 0.27, "learning_rate": 1.9821627720597865e-05, "loss": 0.5094, "step": 1434 }, { "epoch": 0.27, "learning_rate": 1.982125193839526e-05, "loss": 0.5255, "step": 1435 }, { "epoch": 0.27, "learning_rate": 1.9820875764342894e-05, "loss": 0.5101, "step": 1436 }, { "epoch": 0.27, "learning_rate": 1.9820499198455762e-05, "loss": 0.4918, "step": 1437 }, { "epoch": 0.27, "learning_rate": 1.98201222407489e-05, "loss": 0.4886, "step": 1438 }, { "epoch": 0.27, "learning_rate": 1.9819744891237337e-05, "loss": 0.4874, "step": 1439 }, { "epoch": 0.27, "learning_rate": 1.9819367149936136e-05, "loss": 0.4801, "step": 1440 }, { "epoch": 0.27, "learning_rate": 1.9818989016860365e-05, "loss": 0.5048, "step": 1441 }, { "epoch": 0.27, "learning_rate": 1.981861049202511e-05, "loss": 0.4949, "step": 1442 }, { "epoch": 0.27, "learning_rate": 1.9818231575445474e-05, "loss": 0.5256, "step": 1443 }, { "epoch": 0.27, "learning_rate": 1.9817852267136577e-05, "loss": 0.4861, "step": 1444 }, { "epoch": 0.27, "learning_rate": 1.9817472567113557e-05, "loss": 0.4997, "step": 1445 }, { "epoch": 0.27, "learning_rate": 1.981709247539155e-05, "loss": 0.5037, "step": 1446 }, { "epoch": 0.27, "learning_rate": 1.981671199198574e-05, "loss": 0.4994, "step": 1447 }, { "epoch": 0.27, "learning_rate": 1.9816331116911286e-05, "loss": 0.4898, "step": 1448 }, { "epoch": 0.27, "learning_rate": 1.9815949850183397e-05, "loss": 0.498, "step": 1449 }, { "epoch": 0.27, "learning_rate": 1.981556819181729e-05, "loss": 0.4735, "step": 1450 }, { "epoch": 0.27, "learning_rate": 1.9815186141828174e-05, "loss": 0.4943, "step": 1451 }, { "epoch": 0.27, "learning_rate": 1.9814803700231313e-05, "loss": 0.4934, "step": 1452 }, { "epoch": 0.27, "learning_rate": 1.9814420867041952e-05, "loss": 0.5016, "step": 1453 }, { "epoch": 0.27, "learning_rate": 1.9814037642275368e-05, "loss": 0.5195, "step": 1454 }, { "epoch": 0.27, "learning_rate": 1.9813654025946856e-05, "loss": 0.5007, "step": 1455 }, { "epoch": 0.27, "learning_rate": 1.9813270018071712e-05, "loss": 0.4932, "step": 1456 }, { "epoch": 0.27, "learning_rate": 1.981288561866527e-05, "loss": 0.4798, "step": 1457 }, { "epoch": 0.27, "learning_rate": 1.9812500827742857e-05, "loss": 0.5131, "step": 1458 }, { "epoch": 0.27, "learning_rate": 1.9812115645319827e-05, "loss": 0.4865, "step": 1459 }, { "epoch": 0.27, "learning_rate": 1.981173007141155e-05, "loss": 0.5208, "step": 1460 }, { "epoch": 0.27, "learning_rate": 1.981134410603341e-05, "loss": 0.4941, "step": 1461 }, { "epoch": 0.27, "learning_rate": 1.9810957749200804e-05, "loss": 0.4836, "step": 1462 }, { "epoch": 0.27, "learning_rate": 1.9810571000929148e-05, "loss": 0.5169, "step": 1463 }, { "epoch": 0.27, "learning_rate": 1.9810183861233874e-05, "loss": 0.5075, "step": 1464 }, { "epoch": 0.27, "learning_rate": 1.9809796330130427e-05, "loss": 0.5243, "step": 1465 }, { "epoch": 0.27, "learning_rate": 1.980940840763427e-05, "loss": 0.5192, "step": 1466 }, { "epoch": 0.27, "learning_rate": 1.9809020093760876e-05, "loss": 0.4752, "step": 1467 }, { "epoch": 0.27, "learning_rate": 1.9808631388525743e-05, "loss": 0.5106, "step": 1468 }, { "epoch": 0.27, "learning_rate": 1.980824229194438e-05, "loss": 0.5064, "step": 1469 }, { "epoch": 0.27, "learning_rate": 1.9807852804032306e-05, "loss": 0.5374, "step": 1470 }, { "epoch": 0.27, "learning_rate": 1.9807462924805065e-05, "loss": 0.5136, "step": 1471 }, { "epoch": 0.27, "learning_rate": 1.980707265427821e-05, "loss": 0.5121, "step": 1472 }, { "epoch": 0.27, "learning_rate": 1.9806681992467314e-05, "loss": 0.5275, "step": 1473 }, { "epoch": 0.27, "learning_rate": 1.9806290939387965e-05, "loss": 0.514, "step": 1474 }, { "epoch": 0.27, "learning_rate": 1.9805899495055762e-05, "loss": 0.5011, "step": 1475 }, { "epoch": 0.27, "learning_rate": 1.9805507659486325e-05, "loss": 0.5215, "step": 1476 }, { "epoch": 0.27, "learning_rate": 1.9805115432695284e-05, "loss": 0.4754, "step": 1477 }, { "epoch": 0.27, "learning_rate": 1.9804722814698295e-05, "loss": 0.5013, "step": 1478 }, { "epoch": 0.27, "learning_rate": 1.9804329805511018e-05, "loss": 0.4964, "step": 1479 }, { "epoch": 0.27, "learning_rate": 1.980393640514913e-05, "loss": 0.5293, "step": 1480 }, { "epoch": 0.27, "learning_rate": 1.9803542613628335e-05, "loss": 0.5249, "step": 1481 }, { "epoch": 0.27, "learning_rate": 1.9803148430964338e-05, "loss": 0.4894, "step": 1482 }, { "epoch": 0.27, "learning_rate": 1.980275385717287e-05, "loss": 0.5149, "step": 1483 }, { "epoch": 0.27, "learning_rate": 1.9802358892269674e-05, "loss": 0.499, "step": 1484 }, { "epoch": 0.27, "learning_rate": 1.9801963536270504e-05, "loss": 0.5149, "step": 1485 }, { "epoch": 0.27, "learning_rate": 1.9801567789191137e-05, "loss": 0.5109, "step": 1486 }, { "epoch": 0.28, "learning_rate": 1.9801171651047362e-05, "loss": 0.4905, "step": 1487 }, { "epoch": 0.28, "learning_rate": 1.9800775121854987e-05, "loss": 0.5036, "step": 1488 }, { "epoch": 0.28, "learning_rate": 1.9800378201629828e-05, "loss": 0.5084, "step": 1489 }, { "epoch": 0.28, "learning_rate": 1.9799980890387724e-05, "loss": 0.5093, "step": 1490 }, { "epoch": 0.28, "learning_rate": 1.9799583188144526e-05, "loss": 0.4806, "step": 1491 }, { "epoch": 0.28, "learning_rate": 1.9799185094916104e-05, "loss": 0.5047, "step": 1492 }, { "epoch": 0.28, "learning_rate": 1.979878661071834e-05, "loss": 0.4748, "step": 1493 }, { "epoch": 0.28, "learning_rate": 1.979838773556713e-05, "loss": 0.5096, "step": 1494 }, { "epoch": 0.28, "learning_rate": 1.9797988469478392e-05, "loss": 0.4971, "step": 1495 }, { "epoch": 0.28, "learning_rate": 1.9797588812468052e-05, "loss": 0.5125, "step": 1496 }, { "epoch": 0.28, "learning_rate": 1.9797188764552065e-05, "loss": 0.5091, "step": 1497 }, { "epoch": 0.28, "learning_rate": 1.9796788325746378e-05, "loss": 0.5015, "step": 1498 }, { "epoch": 0.28, "learning_rate": 1.9796387496066977e-05, "loss": 0.5019, "step": 1499 }, { "epoch": 0.28, "learning_rate": 1.9795986275529857e-05, "loss": 0.4881, "step": 1500 }, { "epoch": 0.28, "learning_rate": 1.9795584664151016e-05, "loss": 0.5257, "step": 1501 }, { "epoch": 0.28, "learning_rate": 1.9795182661946484e-05, "loss": 0.5082, "step": 1502 }, { "epoch": 0.28, "learning_rate": 1.9794780268932298e-05, "loss": 0.5049, "step": 1503 }, { "epoch": 0.28, "learning_rate": 1.9794377485124516e-05, "loss": 0.4874, "step": 1504 }, { "epoch": 0.28, "learning_rate": 1.9793974310539205e-05, "loss": 0.5079, "step": 1505 }, { "epoch": 0.28, "learning_rate": 1.9793570745192456e-05, "loss": 0.506, "step": 1506 }, { "epoch": 0.28, "learning_rate": 1.979316678910036e-05, "loss": 0.4876, "step": 1507 }, { "epoch": 0.28, "learning_rate": 1.9792762442279044e-05, "loss": 0.5136, "step": 1508 }, { "epoch": 0.28, "learning_rate": 1.9792357704744635e-05, "loss": 0.5168, "step": 1509 }, { "epoch": 0.28, "learning_rate": 1.9791952576513285e-05, "loss": 0.5193, "step": 1510 }, { "epoch": 0.28, "learning_rate": 1.979154705760116e-05, "loss": 0.5235, "step": 1511 }, { "epoch": 0.28, "learning_rate": 1.9791141148024432e-05, "loss": 0.5126, "step": 1512 }, { "epoch": 0.28, "learning_rate": 1.9790734847799302e-05, "loss": 0.4831, "step": 1513 }, { "epoch": 0.28, "learning_rate": 1.9790328156941977e-05, "loss": 0.4981, "step": 1514 }, { "epoch": 0.28, "learning_rate": 1.9789921075468687e-05, "loss": 0.503, "step": 1515 }, { "epoch": 0.28, "learning_rate": 1.978951360339567e-05, "loss": 0.5307, "step": 1516 }, { "epoch": 0.28, "learning_rate": 1.9789105740739186e-05, "loss": 0.5182, "step": 1517 }, { "epoch": 0.28, "learning_rate": 1.9788697487515506e-05, "loss": 0.5092, "step": 1518 }, { "epoch": 0.28, "learning_rate": 1.9788288843740922e-05, "loss": 0.4926, "step": 1519 }, { "epoch": 0.28, "learning_rate": 1.978787980943173e-05, "loss": 0.5077, "step": 1520 }, { "epoch": 0.28, "learning_rate": 1.9787470384604262e-05, "loss": 0.506, "step": 1521 }, { "epoch": 0.28, "learning_rate": 1.9787060569274845e-05, "loss": 0.5163, "step": 1522 }, { "epoch": 0.28, "learning_rate": 1.978665036345983e-05, "loss": 0.4945, "step": 1523 }, { "epoch": 0.28, "learning_rate": 1.9786239767175583e-05, "loss": 0.5137, "step": 1524 }, { "epoch": 0.28, "learning_rate": 1.978582878043849e-05, "loss": 0.5113, "step": 1525 }, { "epoch": 0.28, "learning_rate": 1.9785417403264948e-05, "loss": 0.5286, "step": 1526 }, { "epoch": 0.28, "learning_rate": 1.9785005635671367e-05, "loss": 0.5213, "step": 1527 }, { "epoch": 0.28, "learning_rate": 1.9784593477674183e-05, "loss": 0.4924, "step": 1528 }, { "epoch": 0.28, "learning_rate": 1.9784180929289826e-05, "loss": 0.5176, "step": 1529 }, { "epoch": 0.28, "learning_rate": 1.978376799053477e-05, "loss": 0.4891, "step": 1530 }, { "epoch": 0.28, "learning_rate": 1.9783354661425486e-05, "loss": 0.4887, "step": 1531 }, { "epoch": 0.28, "learning_rate": 1.9782940941978462e-05, "loss": 0.5016, "step": 1532 }, { "epoch": 0.28, "learning_rate": 1.9782526832210206e-05, "loss": 0.5248, "step": 1533 }, { "epoch": 0.28, "learning_rate": 1.9782112332137246e-05, "loss": 0.4914, "step": 1534 }, { "epoch": 0.28, "learning_rate": 1.978169744177611e-05, "loss": 0.5154, "step": 1535 }, { "epoch": 0.28, "learning_rate": 1.9781282161143357e-05, "loss": 0.4993, "step": 1536 }, { "epoch": 0.28, "learning_rate": 1.978086649025556e-05, "loss": 0.5225, "step": 1537 }, { "epoch": 0.28, "learning_rate": 1.9780450429129298e-05, "loss": 0.5059, "step": 1538 }, { "epoch": 0.28, "learning_rate": 1.9780033977781167e-05, "loss": 0.4866, "step": 1539 }, { "epoch": 0.28, "learning_rate": 1.977961713622779e-05, "loss": 0.487, "step": 1540 }, { "epoch": 0.29, "learning_rate": 1.97791999044858e-05, "loss": 0.4964, "step": 1541 }, { "epoch": 0.29, "learning_rate": 1.977878228257183e-05, "loss": 0.523, "step": 1542 }, { "epoch": 0.29, "learning_rate": 1.977836427050256e-05, "loss": 0.5185, "step": 1543 }, { "epoch": 0.29, "learning_rate": 1.9777945868294656e-05, "loss": 0.5297, "step": 1544 }, { "epoch": 0.29, "learning_rate": 1.9777527075964817e-05, "loss": 0.5014, "step": 1545 }, { "epoch": 0.29, "learning_rate": 1.9777107893529747e-05, "loss": 0.5292, "step": 1546 }, { "epoch": 0.29, "learning_rate": 1.977668832100618e-05, "loss": 0.5056, "step": 1547 }, { "epoch": 0.29, "learning_rate": 1.9776268358410843e-05, "loss": 0.4811, "step": 1548 }, { "epoch": 0.29, "learning_rate": 1.9775848005760504e-05, "loss": 0.5055, "step": 1549 }, { "epoch": 0.29, "learning_rate": 1.9775427263071927e-05, "loss": 0.5099, "step": 1550 }, { "epoch": 0.29, "learning_rate": 1.9775006130361904e-05, "loss": 0.4818, "step": 1551 }, { "epoch": 0.29, "learning_rate": 1.9774584607647228e-05, "loss": 0.5175, "step": 1552 }, { "epoch": 0.29, "learning_rate": 1.977416269494473e-05, "loss": 0.493, "step": 1553 }, { "epoch": 0.29, "learning_rate": 1.9773740392271234e-05, "loss": 0.5111, "step": 1554 }, { "epoch": 0.29, "learning_rate": 1.977331769964359e-05, "loss": 0.4837, "step": 1555 }, { "epoch": 0.29, "learning_rate": 1.9772894617078666e-05, "loss": 0.4955, "step": 1556 }, { "epoch": 0.29, "learning_rate": 1.9772471144593344e-05, "loss": 0.512, "step": 1557 }, { "epoch": 0.29, "learning_rate": 1.9772047282204512e-05, "loss": 0.4942, "step": 1558 }, { "epoch": 0.29, "learning_rate": 1.9771623029929088e-05, "loss": 0.496, "step": 1559 }, { "epoch": 0.29, "learning_rate": 1.9771198387783995e-05, "loss": 0.4862, "step": 1560 }, { "epoch": 0.29, "learning_rate": 1.9770773355786178e-05, "loss": 0.4786, "step": 1561 }, { "epoch": 0.29, "learning_rate": 1.9770347933952597e-05, "loss": 0.5017, "step": 1562 }, { "epoch": 0.29, "learning_rate": 1.9769922122300223e-05, "loss": 0.5142, "step": 1563 }, { "epoch": 0.29, "learning_rate": 1.9769495920846042e-05, "loss": 0.4811, "step": 1564 }, { "epoch": 0.29, "learning_rate": 1.976906932960706e-05, "loss": 0.541, "step": 1565 }, { "epoch": 0.29, "learning_rate": 1.9768642348600303e-05, "loss": 0.5189, "step": 1566 }, { "epoch": 0.29, "learning_rate": 1.97682149778428e-05, "loss": 0.505, "step": 1567 }, { "epoch": 0.29, "learning_rate": 1.9767787217351604e-05, "loss": 0.4884, "step": 1568 }, { "epoch": 0.29, "learning_rate": 1.9767359067143784e-05, "loss": 0.5105, "step": 1569 }, { "epoch": 0.29, "learning_rate": 1.976693052723642e-05, "loss": 0.4896, "step": 1570 }, { "epoch": 0.29, "learning_rate": 1.976650159764661e-05, "loss": 0.4927, "step": 1571 }, { "epoch": 0.29, "learning_rate": 1.976607227839147e-05, "loss": 0.5105, "step": 1572 }, { "epoch": 0.29, "learning_rate": 1.976564256948813e-05, "loss": 0.5418, "step": 1573 }, { "epoch": 0.29, "learning_rate": 1.976521247095373e-05, "loss": 0.5167, "step": 1574 }, { "epoch": 0.29, "learning_rate": 1.976478198280543e-05, "loss": 0.5077, "step": 1575 }, { "epoch": 0.29, "learning_rate": 1.976435110506041e-05, "loss": 0.5007, "step": 1576 }, { "epoch": 0.29, "learning_rate": 1.976391983773586e-05, "loss": 0.5174, "step": 1577 }, { "epoch": 0.29, "learning_rate": 1.9763488180848983e-05, "loss": 0.5016, "step": 1578 }, { "epoch": 0.29, "learning_rate": 1.9763056134417007e-05, "loss": 0.4857, "step": 1579 }, { "epoch": 0.29, "learning_rate": 1.9762623698457164e-05, "loss": 0.485, "step": 1580 }, { "epoch": 0.29, "learning_rate": 1.9762190872986712e-05, "loss": 0.4821, "step": 1581 }, { "epoch": 0.29, "learning_rate": 1.976175765802292e-05, "loss": 0.4966, "step": 1582 }, { "epoch": 0.29, "learning_rate": 1.976132405358307e-05, "loss": 0.4981, "step": 1583 }, { "epoch": 0.29, "learning_rate": 1.976089005968446e-05, "loss": 0.5275, "step": 1584 }, { "epoch": 0.29, "learning_rate": 1.9760455676344413e-05, "loss": 0.5238, "step": 1585 }, { "epoch": 0.29, "learning_rate": 1.9760020903580252e-05, "loss": 0.4915, "step": 1586 }, { "epoch": 0.29, "learning_rate": 1.975958574140933e-05, "loss": 0.5119, "step": 1587 }, { "epoch": 0.29, "learning_rate": 1.9759150189849007e-05, "loss": 0.5086, "step": 1588 }, { "epoch": 0.29, "learning_rate": 1.9758714248916653e-05, "loss": 0.5081, "step": 1589 }, { "epoch": 0.29, "learning_rate": 1.9758277918629675e-05, "loss": 0.5363, "step": 1590 }, { "epoch": 0.29, "learning_rate": 1.9757841199005473e-05, "loss": 0.5141, "step": 1591 }, { "epoch": 0.29, "learning_rate": 1.9757404090061475e-05, "loss": 0.5155, "step": 1592 }, { "epoch": 0.29, "learning_rate": 1.9756966591815118e-05, "loss": 0.4967, "step": 1593 }, { "epoch": 0.29, "learning_rate": 1.9756528704283856e-05, "loss": 0.5032, "step": 1594 }, { "epoch": 0.3, "learning_rate": 1.9756090427485163e-05, "loss": 0.4971, "step": 1595 }, { "epoch": 0.3, "learning_rate": 1.9755651761436528e-05, "loss": 0.4853, "step": 1596 }, { "epoch": 0.3, "learning_rate": 1.975521270615545e-05, "loss": 0.5018, "step": 1597 }, { "epoch": 0.3, "learning_rate": 1.9754773261659444e-05, "loss": 0.51, "step": 1598 }, { "epoch": 0.3, "learning_rate": 1.9754333427966045e-05, "loss": 0.4629, "step": 1599 }, { "epoch": 0.3, "learning_rate": 1.9753893205092804e-05, "loss": 0.4906, "step": 1600 }, { "epoch": 0.3, "learning_rate": 1.975345259305728e-05, "loss": 0.4986, "step": 1601 }, { "epoch": 0.3, "learning_rate": 1.9753011591877058e-05, "loss": 0.4963, "step": 1602 }, { "epoch": 0.3, "learning_rate": 1.975257020156973e-05, "loss": 0.4799, "step": 1603 }, { "epoch": 0.3, "learning_rate": 1.9752128422152907e-05, "loss": 0.5095, "step": 1604 }, { "epoch": 0.3, "learning_rate": 1.9751686253644217e-05, "loss": 0.5294, "step": 1605 }, { "epoch": 0.3, "learning_rate": 1.97512436960613e-05, "loss": 0.4792, "step": 1606 }, { "epoch": 0.3, "learning_rate": 1.9750800749421813e-05, "loss": 0.5044, "step": 1607 }, { "epoch": 0.3, "learning_rate": 1.9750357413743427e-05, "loss": 0.4881, "step": 1608 }, { "epoch": 0.3, "learning_rate": 1.9749913689043834e-05, "loss": 0.5286, "step": 1609 }, { "epoch": 0.3, "learning_rate": 1.9749469575340736e-05, "loss": 0.5109, "step": 1610 }, { "epoch": 0.3, "learning_rate": 1.9749025072651854e-05, "loss": 0.5135, "step": 1611 }, { "epoch": 0.3, "learning_rate": 1.974858018099492e-05, "loss": 0.5016, "step": 1612 }, { "epoch": 0.3, "learning_rate": 1.9748134900387686e-05, "loss": 0.4944, "step": 1613 }, { "epoch": 0.3, "learning_rate": 1.974768923084792e-05, "loss": 0.5001, "step": 1614 }, { "epoch": 0.3, "learning_rate": 1.97472431723934e-05, "loss": 0.5125, "step": 1615 }, { "epoch": 0.3, "learning_rate": 1.974679672504192e-05, "loss": 0.4975, "step": 1616 }, { "epoch": 0.3, "learning_rate": 1.9746349888811304e-05, "loss": 0.5035, "step": 1617 }, { "epoch": 0.3, "learning_rate": 1.9745902663719367e-05, "loss": 0.5106, "step": 1618 }, { "epoch": 0.3, "learning_rate": 1.9745455049783958e-05, "loss": 0.5053, "step": 1619 }, { "epoch": 0.3, "learning_rate": 1.9745007047022936e-05, "loss": 0.5171, "step": 1620 }, { "epoch": 0.3, "learning_rate": 1.9744558655454175e-05, "loss": 0.5206, "step": 1621 }, { "epoch": 0.3, "learning_rate": 1.9744109875095566e-05, "loss": 0.4988, "step": 1622 }, { "epoch": 0.3, "learning_rate": 1.9743660705965017e-05, "loss": 0.4983, "step": 1623 }, { "epoch": 0.3, "learning_rate": 1.974321114808044e-05, "loss": 0.4917, "step": 1624 }, { "epoch": 0.3, "learning_rate": 1.974276120145978e-05, "loss": 0.4959, "step": 1625 }, { "epoch": 0.3, "learning_rate": 1.9742310866120987e-05, "loss": 0.4895, "step": 1626 }, { "epoch": 0.3, "learning_rate": 1.9741860142082024e-05, "loss": 0.4817, "step": 1627 }, { "epoch": 0.3, "learning_rate": 1.974140902936088e-05, "loss": 0.502, "step": 1628 }, { "epoch": 0.3, "learning_rate": 1.9740957527975553e-05, "loss": 0.4995, "step": 1629 }, { "epoch": 0.3, "learning_rate": 1.9740505637944056e-05, "loss": 0.4948, "step": 1630 }, { "epoch": 0.3, "learning_rate": 1.9740053359284416e-05, "loss": 0.5073, "step": 1631 }, { "epoch": 0.3, "learning_rate": 1.9739600692014683e-05, "loss": 0.5141, "step": 1632 }, { "epoch": 0.3, "learning_rate": 1.973914763615291e-05, "loss": 0.5095, "step": 1633 }, { "epoch": 0.3, "learning_rate": 1.973869419171718e-05, "loss": 0.4929, "step": 1634 }, { "epoch": 0.3, "learning_rate": 1.9738240358725585e-05, "loss": 0.5176, "step": 1635 }, { "epoch": 0.3, "learning_rate": 1.9737786137196228e-05, "loss": 0.5152, "step": 1636 }, { "epoch": 0.3, "learning_rate": 1.973733152714723e-05, "loss": 0.51, "step": 1637 }, { "epoch": 0.3, "learning_rate": 1.9736876528596737e-05, "loss": 0.5084, "step": 1638 }, { "epoch": 0.3, "learning_rate": 1.9736421141562896e-05, "loss": 0.4874, "step": 1639 }, { "epoch": 0.3, "learning_rate": 1.9735965366063875e-05, "loss": 0.4972, "step": 1640 }, { "epoch": 0.3, "learning_rate": 1.973550920211787e-05, "loss": 0.504, "step": 1641 }, { "epoch": 0.3, "learning_rate": 1.9735052649743065e-05, "loss": 0.4823, "step": 1642 }, { "epoch": 0.3, "learning_rate": 1.9734595708957685e-05, "loss": 0.5121, "step": 1643 }, { "epoch": 0.3, "learning_rate": 1.973413837977996e-05, "loss": 0.5049, "step": 1644 }, { "epoch": 0.3, "learning_rate": 1.9733680662228135e-05, "loss": 0.497, "step": 1645 }, { "epoch": 0.3, "learning_rate": 1.9733222556320472e-05, "loss": 0.491, "step": 1646 }, { "epoch": 0.3, "learning_rate": 1.9732764062075253e-05, "loss": 0.5093, "step": 1647 }, { "epoch": 0.3, "learning_rate": 1.9732305179510765e-05, "loss": 0.5132, "step": 1648 }, { "epoch": 0.31, "learning_rate": 1.973184590864532e-05, "loss": 0.4898, "step": 1649 }, { "epoch": 0.31, "learning_rate": 1.973138624949724e-05, "loss": 0.4949, "step": 1650 }, { "epoch": 0.31, "learning_rate": 1.973092620208487e-05, "loss": 0.5091, "step": 1651 }, { "epoch": 0.31, "learning_rate": 1.9730465766426556e-05, "loss": 0.4836, "step": 1652 }, { "epoch": 0.31, "learning_rate": 1.9730004942540676e-05, "loss": 0.4876, "step": 1653 }, { "epoch": 0.31, "learning_rate": 1.9729543730445614e-05, "loss": 0.4928, "step": 1654 }, { "epoch": 0.31, "learning_rate": 1.972908213015977e-05, "loss": 0.5125, "step": 1655 }, { "epoch": 0.31, "learning_rate": 1.972862014170156e-05, "loss": 0.5169, "step": 1656 }, { "epoch": 0.31, "learning_rate": 1.972815776508942e-05, "loss": 0.5027, "step": 1657 }, { "epoch": 0.31, "learning_rate": 1.9727695000341795e-05, "loss": 0.5011, "step": 1658 }, { "epoch": 0.31, "learning_rate": 1.9727231847477153e-05, "loss": 0.5023, "step": 1659 }, { "epoch": 0.31, "learning_rate": 1.9726768306513967e-05, "loss": 0.4889, "step": 1660 }, { "epoch": 0.31, "learning_rate": 1.9726304377470735e-05, "loss": 0.4805, "step": 1661 }, { "epoch": 0.31, "learning_rate": 1.9725840060365968e-05, "loss": 0.4951, "step": 1662 }, { "epoch": 0.31, "learning_rate": 1.972537535521819e-05, "loss": 0.4899, "step": 1663 }, { "epoch": 0.31, "learning_rate": 1.9724910262045938e-05, "loss": 0.5161, "step": 1664 }, { "epoch": 0.31, "learning_rate": 1.9724444780867772e-05, "loss": 0.5327, "step": 1665 }, { "epoch": 0.31, "learning_rate": 1.9723978911702265e-05, "loss": 0.4887, "step": 1666 }, { "epoch": 0.31, "learning_rate": 1.9723512654568e-05, "loss": 0.487, "step": 1667 }, { "epoch": 0.31, "learning_rate": 1.9723046009483587e-05, "loss": 0.4855, "step": 1668 }, { "epoch": 0.31, "learning_rate": 1.9722578976467638e-05, "loss": 0.5271, "step": 1669 }, { "epoch": 0.31, "learning_rate": 1.972211155553879e-05, "loss": 0.5025, "step": 1670 }, { "epoch": 0.31, "learning_rate": 1.972164374671569e-05, "loss": 0.5292, "step": 1671 }, { "epoch": 0.31, "learning_rate": 1.9721175550017e-05, "loss": 0.5023, "step": 1672 }, { "epoch": 0.31, "learning_rate": 1.972070696546141e-05, "loss": 0.5132, "step": 1673 }, { "epoch": 0.31, "learning_rate": 1.9720237993067607e-05, "loss": 0.4809, "step": 1674 }, { "epoch": 0.31, "learning_rate": 1.9719768632854303e-05, "loss": 0.4915, "step": 1675 }, { "epoch": 0.31, "learning_rate": 1.9719298884840226e-05, "loss": 0.4858, "step": 1676 }, { "epoch": 0.31, "learning_rate": 1.9718828749044122e-05, "loss": 0.4854, "step": 1677 }, { "epoch": 0.31, "learning_rate": 1.9718358225484744e-05, "loss": 0.4933, "step": 1678 }, { "epoch": 0.31, "learning_rate": 1.9717887314180862e-05, "loss": 0.4945, "step": 1679 }, { "epoch": 0.31, "learning_rate": 1.9717416015151274e-05, "loss": 0.491, "step": 1680 }, { "epoch": 0.31, "learning_rate": 1.9716944328414773e-05, "loss": 0.4547, "step": 1681 }, { "epoch": 0.31, "learning_rate": 1.9716472253990185e-05, "loss": 0.4916, "step": 1682 }, { "epoch": 0.31, "learning_rate": 1.9715999791896347e-05, "loss": 0.5091, "step": 1683 }, { "epoch": 0.31, "learning_rate": 1.9715526942152103e-05, "loss": 0.5045, "step": 1684 }, { "epoch": 0.31, "learning_rate": 1.9715053704776324e-05, "loss": 0.5063, "step": 1685 }, { "epoch": 0.31, "learning_rate": 1.9714580079787886e-05, "loss": 0.4952, "step": 1686 }, { "epoch": 0.31, "learning_rate": 1.9714106067205693e-05, "loss": 0.5129, "step": 1687 }, { "epoch": 0.31, "learning_rate": 1.971363166704865e-05, "loss": 0.5001, "step": 1688 }, { "epoch": 0.31, "learning_rate": 1.9713156879335686e-05, "loss": 0.4884, "step": 1689 }, { "epoch": 0.31, "learning_rate": 1.971268170408575e-05, "loss": 0.5078, "step": 1690 }, { "epoch": 0.31, "learning_rate": 1.9712206141317795e-05, "loss": 0.4951, "step": 1691 }, { "epoch": 0.31, "learning_rate": 1.9711730191050794e-05, "loss": 0.5076, "step": 1692 }, { "epoch": 0.31, "learning_rate": 1.9711253853303742e-05, "loss": 0.5074, "step": 1693 }, { "epoch": 0.31, "learning_rate": 1.9710777128095642e-05, "loss": 0.5233, "step": 1694 }, { "epoch": 0.31, "learning_rate": 1.971030001544551e-05, "loss": 0.4961, "step": 1695 }, { "epoch": 0.31, "learning_rate": 1.970982251537239e-05, "loss": 0.504, "step": 1696 }, { "epoch": 0.31, "learning_rate": 1.9709344627895327e-05, "loss": 0.495, "step": 1697 }, { "epoch": 0.31, "learning_rate": 1.970886635303339e-05, "loss": 0.486, "step": 1698 }, { "epoch": 0.31, "learning_rate": 1.9708387690805662e-05, "loss": 0.5139, "step": 1699 }, { "epoch": 0.31, "learning_rate": 1.9707908641231236e-05, "loss": 0.4869, "step": 1700 }, { "epoch": 0.31, "learning_rate": 1.9707429204329232e-05, "loss": 0.5121, "step": 1701 }, { "epoch": 0.31, "learning_rate": 1.9706949380118774e-05, "loss": 0.5026, "step": 1702 }, { "epoch": 0.32, "learning_rate": 1.970646916861901e-05, "loss": 0.4974, "step": 1703 }, { "epoch": 0.32, "learning_rate": 1.9705988569849094e-05, "loss": 0.4953, "step": 1704 }, { "epoch": 0.32, "learning_rate": 1.9705507583828205e-05, "loss": 0.5246, "step": 1705 }, { "epoch": 0.32, "learning_rate": 1.9705026210575535e-05, "loss": 0.5071, "step": 1706 }, { "epoch": 0.32, "learning_rate": 1.9704544450110287e-05, "loss": 0.5058, "step": 1707 }, { "epoch": 0.32, "learning_rate": 1.970406230245168e-05, "loss": 0.5103, "step": 1708 }, { "epoch": 0.32, "learning_rate": 1.9703579767618958e-05, "loss": 0.5037, "step": 1709 }, { "epoch": 0.32, "learning_rate": 1.9703096845631365e-05, "loss": 0.4825, "step": 1710 }, { "epoch": 0.32, "learning_rate": 1.9702613536508174e-05, "loss": 0.4899, "step": 1711 }, { "epoch": 0.32, "learning_rate": 1.970212984026867e-05, "loss": 0.4847, "step": 1712 }, { "epoch": 0.32, "learning_rate": 1.9701645756932143e-05, "loss": 0.4936, "step": 1713 }, { "epoch": 0.32, "learning_rate": 1.9701161286517917e-05, "loss": 0.5082, "step": 1714 }, { "epoch": 0.32, "learning_rate": 1.9700676429045312e-05, "loss": 0.4982, "step": 1715 }, { "epoch": 0.32, "learning_rate": 1.9700191184533683e-05, "loss": 0.4819, "step": 1716 }, { "epoch": 0.32, "learning_rate": 1.9699705553002384e-05, "loss": 0.4992, "step": 1717 }, { "epoch": 0.32, "learning_rate": 1.969921953447079e-05, "loss": 0.4818, "step": 1718 }, { "epoch": 0.32, "learning_rate": 1.9698733128958295e-05, "loss": 0.5139, "step": 1719 }, { "epoch": 0.32, "learning_rate": 1.9698246336484306e-05, "loss": 0.4891, "step": 1720 }, { "epoch": 0.32, "learning_rate": 1.969775915706824e-05, "loss": 0.5118, "step": 1721 }, { "epoch": 0.32, "learning_rate": 1.9697271590729542e-05, "loss": 0.4883, "step": 1722 }, { "epoch": 0.32, "learning_rate": 1.9696783637487663e-05, "loss": 0.5171, "step": 1723 }, { "epoch": 0.32, "learning_rate": 1.969629529736207e-05, "loss": 0.5104, "step": 1724 }, { "epoch": 0.32, "learning_rate": 1.9695806570372242e-05, "loss": 0.4892, "step": 1725 }, { "epoch": 0.32, "learning_rate": 1.9695317456537685e-05, "loss": 0.5042, "step": 1726 }, { "epoch": 0.32, "learning_rate": 1.9694827955877915e-05, "loss": 0.49, "step": 1727 }, { "epoch": 0.32, "learning_rate": 1.9694338068412455e-05, "loss": 0.5058, "step": 1728 }, { "epoch": 0.32, "learning_rate": 1.969384779416086e-05, "loss": 0.5065, "step": 1729 }, { "epoch": 0.32, "learning_rate": 1.9693357133142682e-05, "loss": 0.5081, "step": 1730 }, { "epoch": 0.32, "learning_rate": 1.96928660853775e-05, "loss": 0.5198, "step": 1731 }, { "epoch": 0.32, "learning_rate": 1.9692374650884908e-05, "loss": 0.5009, "step": 1732 }, { "epoch": 0.32, "learning_rate": 1.9691882829684514e-05, "loss": 0.498, "step": 1733 }, { "epoch": 0.32, "learning_rate": 1.9691390621795938e-05, "loss": 0.5057, "step": 1734 }, { "epoch": 0.32, "learning_rate": 1.969089802723882e-05, "loss": 0.5182, "step": 1735 }, { "epoch": 0.32, "learning_rate": 1.9690405046032813e-05, "loss": 0.4998, "step": 1736 }, { "epoch": 0.32, "learning_rate": 1.9689911678197583e-05, "loss": 0.475, "step": 1737 }, { "epoch": 0.32, "learning_rate": 1.968941792375282e-05, "loss": 0.4843, "step": 1738 }, { "epoch": 0.32, "learning_rate": 1.9688923782718224e-05, "loss": 0.5282, "step": 1739 }, { "epoch": 0.32, "learning_rate": 1.9688429255113505e-05, "loss": 0.5065, "step": 1740 }, { "epoch": 0.32, "learning_rate": 1.9687934340958393e-05, "loss": 0.4915, "step": 1741 }, { "epoch": 0.32, "learning_rate": 1.9687439040272643e-05, "loss": 0.472, "step": 1742 }, { "epoch": 0.32, "learning_rate": 1.9686943353076008e-05, "loss": 0.4689, "step": 1743 }, { "epoch": 0.32, "learning_rate": 1.9686447279388268e-05, "loss": 0.4977, "step": 1744 }, { "epoch": 0.32, "learning_rate": 1.9685950819229217e-05, "loss": 0.5084, "step": 1745 }, { "epoch": 0.32, "learning_rate": 1.968545397261866e-05, "loss": 0.5109, "step": 1746 }, { "epoch": 0.32, "learning_rate": 1.968495673957642e-05, "loss": 0.4851, "step": 1747 }, { "epoch": 0.32, "learning_rate": 1.9684459120122342e-05, "loss": 0.489, "step": 1748 }, { "epoch": 0.32, "learning_rate": 1.9683961114276274e-05, "loss": 0.4895, "step": 1749 }, { "epoch": 0.32, "learning_rate": 1.9683462722058086e-05, "loss": 0.4974, "step": 1750 }, { "epoch": 0.32, "learning_rate": 1.9682963943487662e-05, "loss": 0.4803, "step": 1751 }, { "epoch": 0.32, "learning_rate": 1.9682464778584908e-05, "loss": 0.4884, "step": 1752 }, { "epoch": 0.32, "learning_rate": 1.968196522736973e-05, "loss": 0.4931, "step": 1753 }, { "epoch": 0.32, "learning_rate": 1.9681465289862073e-05, "loss": 0.4834, "step": 1754 }, { "epoch": 0.32, "learning_rate": 1.968096496608187e-05, "loss": 0.5104, "step": 1755 }, { "epoch": 0.32, "learning_rate": 1.968046425604909e-05, "loss": 0.5199, "step": 1756 }, { "epoch": 0.33, "learning_rate": 1.967996315978371e-05, "loss": 0.489, "step": 1757 }, { "epoch": 0.33, "learning_rate": 1.9679461677305722e-05, "loss": 0.4868, "step": 1758 }, { "epoch": 0.33, "learning_rate": 1.9678959808635135e-05, "loss": 0.4724, "step": 1759 }, { "epoch": 0.33, "learning_rate": 1.9678457553791968e-05, "loss": 0.502, "step": 1760 }, { "epoch": 0.33, "learning_rate": 1.9677954912796268e-05, "loss": 0.4819, "step": 1761 }, { "epoch": 0.33, "learning_rate": 1.9677451885668084e-05, "loss": 0.5039, "step": 1762 }, { "epoch": 0.33, "learning_rate": 1.9676948472427482e-05, "loss": 0.4825, "step": 1763 }, { "epoch": 0.33, "learning_rate": 1.967644467309456e-05, "loss": 0.4877, "step": 1764 }, { "epoch": 0.33, "learning_rate": 1.9675940487689406e-05, "loss": 0.4953, "step": 1765 }, { "epoch": 0.33, "learning_rate": 1.9675435916232145e-05, "loss": 0.4924, "step": 1766 }, { "epoch": 0.33, "learning_rate": 1.96749309587429e-05, "loss": 0.4994, "step": 1767 }, { "epoch": 0.33, "learning_rate": 1.9674425615241827e-05, "loss": 0.4935, "step": 1768 }, { "epoch": 0.33, "learning_rate": 1.967391988574908e-05, "loss": 0.4909, "step": 1769 }, { "epoch": 0.33, "learning_rate": 1.9673413770284843e-05, "loss": 0.4826, "step": 1770 }, { "epoch": 0.33, "learning_rate": 1.9672907268869306e-05, "loss": 0.4967, "step": 1771 }, { "epoch": 0.33, "learning_rate": 1.9672400381522676e-05, "loss": 0.497, "step": 1772 }, { "epoch": 0.33, "learning_rate": 1.9671893108265178e-05, "loss": 0.4878, "step": 1773 }, { "epoch": 0.33, "learning_rate": 1.9671385449117057e-05, "loss": 0.464, "step": 1774 }, { "epoch": 0.33, "learning_rate": 1.9670877404098557e-05, "loss": 0.4984, "step": 1775 }, { "epoch": 0.33, "learning_rate": 1.967036897322996e-05, "loss": 0.5091, "step": 1776 }, { "epoch": 0.33, "learning_rate": 1.966986015653154e-05, "loss": 0.497, "step": 1777 }, { "epoch": 0.33, "learning_rate": 1.96693509540236e-05, "loss": 0.4962, "step": 1778 }, { "epoch": 0.33, "learning_rate": 1.9668841365726464e-05, "loss": 0.5012, "step": 1779 }, { "epoch": 0.33, "learning_rate": 1.9668331391660463e-05, "loss": 0.5216, "step": 1780 }, { "epoch": 0.33, "learning_rate": 1.9667821031845934e-05, "loss": 0.4673, "step": 1781 }, { "epoch": 0.33, "learning_rate": 1.9667310286303246e-05, "loss": 0.5109, "step": 1782 }, { "epoch": 0.33, "learning_rate": 1.966679915505278e-05, "loss": 0.4947, "step": 1783 }, { "epoch": 0.33, "learning_rate": 1.966628763811492e-05, "loss": 0.4991, "step": 1784 }, { "epoch": 0.33, "learning_rate": 1.966577573551008e-05, "loss": 0.5019, "step": 1785 }, { "epoch": 0.33, "learning_rate": 1.966526344725869e-05, "loss": 0.5013, "step": 1786 }, { "epoch": 0.33, "learning_rate": 1.9664750773381178e-05, "loss": 0.5054, "step": 1787 }, { "epoch": 0.33, "learning_rate": 1.9664237713898004e-05, "loss": 0.4936, "step": 1788 }, { "epoch": 0.33, "learning_rate": 1.966372426882964e-05, "loss": 0.5048, "step": 1789 }, { "epoch": 0.33, "learning_rate": 1.966321043819657e-05, "loss": 0.5062, "step": 1790 }, { "epoch": 0.33, "learning_rate": 1.9662696222019292e-05, "loss": 0.5206, "step": 1791 }, { "epoch": 0.33, "learning_rate": 1.9662181620318325e-05, "loss": 0.4893, "step": 1792 }, { "epoch": 0.33, "learning_rate": 1.9661666633114203e-05, "loss": 0.4954, "step": 1793 }, { "epoch": 0.33, "learning_rate": 1.966115126042747e-05, "loss": 0.4817, "step": 1794 }, { "epoch": 0.33, "learning_rate": 1.9660635502278688e-05, "loss": 0.4905, "step": 1795 }, { "epoch": 0.33, "learning_rate": 1.9660119358688435e-05, "loss": 0.4911, "step": 1796 }, { "epoch": 0.33, "learning_rate": 1.9659602829677306e-05, "loss": 0.4984, "step": 1797 }, { "epoch": 0.33, "learning_rate": 1.9659085915265905e-05, "loss": 0.5019, "step": 1798 }, { "epoch": 0.33, "learning_rate": 1.9658568615474862e-05, "loss": 0.4824, "step": 1799 }, { "epoch": 0.33, "learning_rate": 1.9658050930324815e-05, "loss": 0.4847, "step": 1800 }, { "epoch": 0.33, "learning_rate": 1.9657532859836413e-05, "loss": 0.5015, "step": 1801 }, { "epoch": 0.33, "learning_rate": 1.9657014404030335e-05, "loss": 0.5164, "step": 1802 }, { "epoch": 0.33, "learning_rate": 1.9656495562927262e-05, "loss": 0.5109, "step": 1803 }, { "epoch": 0.33, "learning_rate": 1.965597633654789e-05, "loss": 0.5028, "step": 1804 }, { "epoch": 0.33, "learning_rate": 1.9655456724912943e-05, "loss": 0.4951, "step": 1805 }, { "epoch": 0.33, "learning_rate": 1.9654936728043147e-05, "loss": 0.5037, "step": 1806 }, { "epoch": 0.33, "learning_rate": 1.9654416345959254e-05, "loss": 0.4943, "step": 1807 }, { "epoch": 0.33, "learning_rate": 1.965389557868202e-05, "loss": 0.4867, "step": 1808 }, { "epoch": 0.33, "learning_rate": 1.965337442623223e-05, "loss": 0.4719, "step": 1809 }, { "epoch": 0.33, "learning_rate": 1.9652852888630672e-05, "loss": 0.5024, "step": 1810 }, { "epoch": 0.34, "learning_rate": 1.9652330965898155e-05, "loss": 0.5191, "step": 1811 }, { "epoch": 0.34, "learning_rate": 1.96518086580555e-05, "loss": 0.4848, "step": 1812 }, { "epoch": 0.34, "learning_rate": 1.9651285965123555e-05, "loss": 0.4905, "step": 1813 }, { "epoch": 0.34, "learning_rate": 1.9650762887123167e-05, "loss": 0.4972, "step": 1814 }, { "epoch": 0.34, "learning_rate": 1.9650239424075207e-05, "loss": 0.5135, "step": 1815 }, { "epoch": 0.34, "learning_rate": 1.964971557600056e-05, "loss": 0.5033, "step": 1816 }, { "epoch": 0.34, "learning_rate": 1.964919134292013e-05, "loss": 0.4965, "step": 1817 }, { "epoch": 0.34, "learning_rate": 1.964866672485483e-05, "loss": 0.4903, "step": 1818 }, { "epoch": 0.34, "learning_rate": 1.9648141721825592e-05, "loss": 0.5006, "step": 1819 }, { "epoch": 0.34, "learning_rate": 1.964761633385336e-05, "loss": 0.4841, "step": 1820 }, { "epoch": 0.34, "learning_rate": 1.96470905609591e-05, "loss": 0.4974, "step": 1821 }, { "epoch": 0.34, "learning_rate": 1.9646564403163787e-05, "loss": 0.4817, "step": 1822 }, { "epoch": 0.34, "learning_rate": 1.964603786048841e-05, "loss": 0.4869, "step": 1823 }, { "epoch": 0.34, "learning_rate": 1.9645510932953988e-05, "loss": 0.5064, "step": 1824 }, { "epoch": 0.34, "learning_rate": 1.9644983620581537e-05, "loss": 0.5023, "step": 1825 }, { "epoch": 0.34, "learning_rate": 1.9644455923392095e-05, "loss": 0.5031, "step": 1826 }, { "epoch": 0.34, "learning_rate": 1.964392784140672e-05, "loss": 0.5029, "step": 1827 }, { "epoch": 0.34, "learning_rate": 1.9643399374646477e-05, "loss": 0.507, "step": 1828 }, { "epoch": 0.34, "learning_rate": 1.9642870523132457e-05, "loss": 0.4848, "step": 1829 }, { "epoch": 0.34, "learning_rate": 1.964234128688575e-05, "loss": 0.5028, "step": 1830 }, { "epoch": 0.34, "learning_rate": 1.9641811665927483e-05, "loss": 0.4658, "step": 1831 }, { "epoch": 0.34, "learning_rate": 1.964128166027878e-05, "loss": 0.5156, "step": 1832 }, { "epoch": 0.34, "learning_rate": 1.964075126996079e-05, "loss": 0.5065, "step": 1833 }, { "epoch": 0.34, "learning_rate": 1.9640220494994674e-05, "loss": 0.4806, "step": 1834 }, { "epoch": 0.34, "learning_rate": 1.963968933540161e-05, "loss": 0.5047, "step": 1835 }, { "epoch": 0.34, "learning_rate": 1.963915779120279e-05, "loss": 0.4724, "step": 1836 }, { "epoch": 0.34, "learning_rate": 1.9638625862419413e-05, "loss": 0.4977, "step": 1837 }, { "epoch": 0.34, "learning_rate": 1.9638093549072718e-05, "loss": 0.5076, "step": 1838 }, { "epoch": 0.34, "learning_rate": 1.9637560851183927e-05, "loss": 0.5075, "step": 1839 }, { "epoch": 0.34, "learning_rate": 1.9637027768774305e-05, "loss": 0.4991, "step": 1840 }, { "epoch": 0.34, "learning_rate": 1.963649430186512e-05, "loss": 0.5051, "step": 1841 }, { "epoch": 0.34, "learning_rate": 1.963596045047765e-05, "loss": 0.4892, "step": 1842 }, { "epoch": 0.34, "learning_rate": 1.96354262146332e-05, "loss": 0.5017, "step": 1843 }, { "epoch": 0.34, "learning_rate": 1.9634891594353088e-05, "loss": 0.4837, "step": 1844 }, { "epoch": 0.34, "learning_rate": 1.9634356589658635e-05, "loss": 0.5089, "step": 1845 }, { "epoch": 0.34, "learning_rate": 1.963382120057119e-05, "loss": 0.5011, "step": 1846 }, { "epoch": 0.34, "learning_rate": 1.9633285427112118e-05, "loss": 0.5093, "step": 1847 }, { "epoch": 0.34, "learning_rate": 1.9632749269302796e-05, "loss": 0.5017, "step": 1848 }, { "epoch": 0.34, "learning_rate": 1.9632212727164606e-05, "loss": 0.4614, "step": 1849 }, { "epoch": 0.34, "learning_rate": 1.9631675800718967e-05, "loss": 0.5045, "step": 1850 }, { "epoch": 0.34, "learning_rate": 1.9631138489987296e-05, "loss": 0.5117, "step": 1851 }, { "epoch": 0.34, "learning_rate": 1.9630600794991028e-05, "loss": 0.4894, "step": 1852 }, { "epoch": 0.34, "learning_rate": 1.9630062715751622e-05, "loss": 0.4882, "step": 1853 }, { "epoch": 0.34, "learning_rate": 1.962952425229054e-05, "loss": 0.4689, "step": 1854 }, { "epoch": 0.34, "learning_rate": 1.962898540462927e-05, "loss": 0.4923, "step": 1855 }, { "epoch": 0.34, "learning_rate": 1.9628446172789313e-05, "loss": 0.5079, "step": 1856 }, { "epoch": 0.34, "learning_rate": 1.9627906556792177e-05, "loss": 0.5098, "step": 1857 }, { "epoch": 0.34, "learning_rate": 1.9627366556659395e-05, "loss": 0.4922, "step": 1858 }, { "epoch": 0.34, "learning_rate": 1.962682617241251e-05, "loss": 0.494, "step": 1859 }, { "epoch": 0.34, "learning_rate": 1.9626285404073088e-05, "loss": 0.4823, "step": 1860 }, { "epoch": 0.34, "learning_rate": 1.9625744251662702e-05, "loss": 0.4823, "step": 1861 }, { "epoch": 0.34, "learning_rate": 1.962520271520294e-05, "loss": 0.4948, "step": 1862 }, { "epoch": 0.34, "learning_rate": 1.962466079471541e-05, "loss": 0.4922, "step": 1863 }, { "epoch": 0.34, "learning_rate": 1.9624118490221734e-05, "loss": 0.4839, "step": 1864 }, { "epoch": 0.35, "learning_rate": 1.9623575801743547e-05, "loss": 0.5038, "step": 1865 }, { "epoch": 0.35, "learning_rate": 1.9623032729302506e-05, "loss": 0.4807, "step": 1866 }, { "epoch": 0.35, "learning_rate": 1.9622489272920274e-05, "loss": 0.479, "step": 1867 }, { "epoch": 0.35, "learning_rate": 1.9621945432618536e-05, "loss": 0.4899, "step": 1868 }, { "epoch": 0.35, "learning_rate": 1.962140120841899e-05, "loss": 0.4986, "step": 1869 }, { "epoch": 0.35, "learning_rate": 1.9620856600343353e-05, "loss": 0.506, "step": 1870 }, { "epoch": 0.35, "learning_rate": 1.9620311608413343e-05, "loss": 0.4942, "step": 1871 }, { "epoch": 0.35, "learning_rate": 1.9619766232650716e-05, "loss": 0.4867, "step": 1872 }, { "epoch": 0.35, "learning_rate": 1.9619220473077227e-05, "loss": 0.5015, "step": 1873 }, { "epoch": 0.35, "learning_rate": 1.9618674329714647e-05, "loss": 0.4942, "step": 1874 }, { "epoch": 0.35, "learning_rate": 1.9618127802584773e-05, "loss": 0.5051, "step": 1875 }, { "epoch": 0.35, "learning_rate": 1.9617580891709407e-05, "loss": 0.471, "step": 1876 }, { "epoch": 0.35, "learning_rate": 1.961703359711037e-05, "loss": 0.4937, "step": 1877 }, { "epoch": 0.35, "learning_rate": 1.9616485918809496e-05, "loss": 0.4899, "step": 1878 }, { "epoch": 0.35, "learning_rate": 1.961593785682864e-05, "loss": 0.5066, "step": 1879 }, { "epoch": 0.35, "learning_rate": 1.9615389411189666e-05, "loss": 0.483, "step": 1880 }, { "epoch": 0.35, "learning_rate": 1.9614840581914457e-05, "loss": 0.4907, "step": 1881 }, { "epoch": 0.35, "learning_rate": 1.961429136902491e-05, "loss": 0.4954, "step": 1882 }, { "epoch": 0.35, "learning_rate": 1.961374177254294e-05, "loss": 0.4932, "step": 1883 }, { "epoch": 0.35, "learning_rate": 1.9613191792490472e-05, "loss": 0.4617, "step": 1884 }, { "epoch": 0.35, "learning_rate": 1.961264142888945e-05, "loss": 0.4906, "step": 1885 }, { "epoch": 0.35, "learning_rate": 1.9612090681761828e-05, "loss": 0.4892, "step": 1886 }, { "epoch": 0.35, "learning_rate": 1.9611539551129587e-05, "loss": 0.4785, "step": 1887 }, { "epoch": 0.35, "learning_rate": 1.9610988037014716e-05, "loss": 0.5096, "step": 1888 }, { "epoch": 0.35, "learning_rate": 1.9610436139439214e-05, "loss": 0.498, "step": 1889 }, { "epoch": 0.35, "learning_rate": 1.96098838584251e-05, "loss": 0.4884, "step": 1890 }, { "epoch": 0.35, "learning_rate": 1.9609331193994418e-05, "loss": 0.4863, "step": 1891 }, { "epoch": 0.35, "learning_rate": 1.9608778146169207e-05, "loss": 0.4921, "step": 1892 }, { "epoch": 0.35, "learning_rate": 1.960822471497154e-05, "loss": 0.4725, "step": 1893 }, { "epoch": 0.35, "learning_rate": 1.9607670900423497e-05, "loss": 0.5007, "step": 1894 }, { "epoch": 0.35, "learning_rate": 1.9607116702547176e-05, "loss": 0.4694, "step": 1895 }, { "epoch": 0.35, "learning_rate": 1.9606562121364682e-05, "loss": 0.4904, "step": 1896 }, { "epoch": 0.35, "learning_rate": 1.9606007156898146e-05, "loss": 0.5049, "step": 1897 }, { "epoch": 0.35, "learning_rate": 1.960545180916971e-05, "loss": 0.4682, "step": 1898 }, { "epoch": 0.35, "learning_rate": 1.9604896078201533e-05, "loss": 0.5009, "step": 1899 }, { "epoch": 0.35, "learning_rate": 1.9604339964015785e-05, "loss": 0.4965, "step": 1900 }, { "epoch": 0.35, "learning_rate": 1.9603783466634652e-05, "loss": 0.4913, "step": 1901 }, { "epoch": 0.35, "learning_rate": 1.9603226586080338e-05, "loss": 0.4891, "step": 1902 }, { "epoch": 0.35, "learning_rate": 1.9602669322375068e-05, "loss": 0.4813, "step": 1903 }, { "epoch": 0.35, "learning_rate": 1.9602111675541068e-05, "loss": 0.4937, "step": 1904 }, { "epoch": 0.35, "learning_rate": 1.960155364560059e-05, "loss": 0.504, "step": 1905 }, { "epoch": 0.35, "learning_rate": 1.9600995232575898e-05, "loss": 0.4974, "step": 1906 }, { "epoch": 0.35, "learning_rate": 1.9600436436489273e-05, "loss": 0.51, "step": 1907 }, { "epoch": 0.35, "learning_rate": 1.9599877257363008e-05, "loss": 0.4922, "step": 1908 }, { "epoch": 0.35, "learning_rate": 1.9599317695219415e-05, "loss": 0.4654, "step": 1909 }, { "epoch": 0.35, "learning_rate": 1.959875775008082e-05, "loss": 0.4837, "step": 1910 }, { "epoch": 0.35, "learning_rate": 1.959819742196956e-05, "loss": 0.5098, "step": 1911 }, { "epoch": 0.35, "learning_rate": 1.9597636710907992e-05, "loss": 0.4987, "step": 1912 }, { "epoch": 0.35, "learning_rate": 1.9597075616918494e-05, "loss": 0.4672, "step": 1913 }, { "epoch": 0.35, "learning_rate": 1.9596514140023443e-05, "loss": 0.4781, "step": 1914 }, { "epoch": 0.35, "learning_rate": 1.9595952280245247e-05, "loss": 0.479, "step": 1915 }, { "epoch": 0.35, "learning_rate": 1.959539003760632e-05, "loss": 0.4958, "step": 1916 }, { "epoch": 0.35, "learning_rate": 1.95948274121291e-05, "loss": 0.4814, "step": 1917 }, { "epoch": 0.35, "learning_rate": 1.9594264403836027e-05, "loss": 0.4873, "step": 1918 }, { "epoch": 0.36, "learning_rate": 1.9593701012749568e-05, "loss": 0.4778, "step": 1919 }, { "epoch": 0.36, "learning_rate": 1.95931372388922e-05, "loss": 0.467, "step": 1920 }, { "epoch": 0.36, "learning_rate": 1.959257308228642e-05, "loss": 0.4895, "step": 1921 }, { "epoch": 0.36, "learning_rate": 1.9592008542954733e-05, "loss": 0.5113, "step": 1922 }, { "epoch": 0.36, "learning_rate": 1.959144362091966e-05, "loss": 0.4986, "step": 1923 }, { "epoch": 0.36, "learning_rate": 1.959087831620375e-05, "loss": 0.484, "step": 1924 }, { "epoch": 0.36, "learning_rate": 1.959031262882955e-05, "loss": 0.4845, "step": 1925 }, { "epoch": 0.36, "learning_rate": 1.9589746558819635e-05, "loss": 0.4986, "step": 1926 }, { "epoch": 0.36, "learning_rate": 1.9589180106196584e-05, "loss": 0.5015, "step": 1927 }, { "epoch": 0.36, "learning_rate": 1.9588613270983004e-05, "loss": 0.4967, "step": 1928 }, { "epoch": 0.36, "learning_rate": 1.9588046053201504e-05, "loss": 0.4975, "step": 1929 }, { "epoch": 0.36, "learning_rate": 1.958747845287472e-05, "loss": 0.5046, "step": 1930 }, { "epoch": 0.36, "learning_rate": 1.9586910470025295e-05, "loss": 0.5027, "step": 1931 }, { "epoch": 0.36, "learning_rate": 1.9586342104675892e-05, "loss": 0.4956, "step": 1932 }, { "epoch": 0.36, "learning_rate": 1.9585773356849188e-05, "loss": 0.4998, "step": 1933 }, { "epoch": 0.36, "learning_rate": 1.9585204226567877e-05, "loss": 0.5354, "step": 1934 }, { "epoch": 0.36, "learning_rate": 1.958463471385466e-05, "loss": 0.4926, "step": 1935 }, { "epoch": 0.36, "learning_rate": 1.9584064818732265e-05, "loss": 0.463, "step": 1936 }, { "epoch": 0.36, "learning_rate": 1.958349454122343e-05, "loss": 0.4825, "step": 1937 }, { "epoch": 0.36, "learning_rate": 1.9582923881350905e-05, "loss": 0.4779, "step": 1938 }, { "epoch": 0.36, "learning_rate": 1.9582352839137458e-05, "loss": 0.4828, "step": 1939 }, { "epoch": 0.36, "learning_rate": 1.9581781414605878e-05, "loss": 0.4776, "step": 1940 }, { "epoch": 0.36, "learning_rate": 1.9581209607778957e-05, "loss": 0.476, "step": 1941 }, { "epoch": 0.36, "learning_rate": 1.958063741867951e-05, "loss": 0.4933, "step": 1942 }, { "epoch": 0.36, "learning_rate": 1.9580064847330368e-05, "loss": 0.5019, "step": 1943 }, { "epoch": 0.36, "learning_rate": 1.957949189375438e-05, "loss": 0.4981, "step": 1944 }, { "epoch": 0.36, "learning_rate": 1.9578918557974398e-05, "loss": 0.4826, "step": 1945 }, { "epoch": 0.36, "learning_rate": 1.95783448400133e-05, "loss": 0.452, "step": 1946 }, { "epoch": 0.36, "learning_rate": 1.9577770739893978e-05, "loss": 0.4833, "step": 1947 }, { "epoch": 0.36, "learning_rate": 1.9577196257639337e-05, "loss": 0.5143, "step": 1948 }, { "epoch": 0.36, "learning_rate": 1.9576621393272294e-05, "loss": 0.4941, "step": 1949 }, { "epoch": 0.36, "learning_rate": 1.957604614681579e-05, "loss": 0.5059, "step": 1950 }, { "epoch": 0.36, "learning_rate": 1.9575470518292776e-05, "loss": 0.5026, "step": 1951 }, { "epoch": 0.36, "learning_rate": 1.9574894507726214e-05, "loss": 0.5073, "step": 1952 }, { "epoch": 0.36, "learning_rate": 1.9574318115139092e-05, "loss": 0.4822, "step": 1953 }, { "epoch": 0.36, "learning_rate": 1.9573741340554398e-05, "loss": 0.49, "step": 1954 }, { "epoch": 0.36, "learning_rate": 1.9573164183995156e-05, "loss": 0.5084, "step": 1955 }, { "epoch": 0.36, "learning_rate": 1.9572586645484386e-05, "loss": 0.4808, "step": 1956 }, { "epoch": 0.36, "learning_rate": 1.957200872504513e-05, "loss": 0.5021, "step": 1957 }, { "epoch": 0.36, "learning_rate": 1.9571430422700448e-05, "loss": 0.4915, "step": 1958 }, { "epoch": 0.36, "learning_rate": 1.9570851738473412e-05, "loss": 0.4774, "step": 1959 }, { "epoch": 0.36, "learning_rate": 1.9570272672387115e-05, "loss": 0.4914, "step": 1960 }, { "epoch": 0.36, "learning_rate": 1.9569693224464657e-05, "loss": 0.4912, "step": 1961 }, { "epoch": 0.36, "learning_rate": 1.9569113394729155e-05, "loss": 0.5201, "step": 1962 }, { "epoch": 0.36, "learning_rate": 1.9568533183203748e-05, "loss": 0.4823, "step": 1963 }, { "epoch": 0.36, "learning_rate": 1.9567952589911578e-05, "loss": 0.5197, "step": 1964 }, { "epoch": 0.36, "learning_rate": 1.9567371614875815e-05, "loss": 0.4872, "step": 1965 }, { "epoch": 0.36, "learning_rate": 1.9566790258119643e-05, "loss": 0.5062, "step": 1966 }, { "epoch": 0.36, "learning_rate": 1.956620851966625e-05, "loss": 0.5008, "step": 1967 }, { "epoch": 0.36, "learning_rate": 1.9565626399538847e-05, "loss": 0.4689, "step": 1968 }, { "epoch": 0.36, "learning_rate": 1.956504389776066e-05, "loss": 0.4794, "step": 1969 }, { "epoch": 0.36, "learning_rate": 1.9564461014354934e-05, "loss": 0.5006, "step": 1970 }, { "epoch": 0.36, "learning_rate": 1.956387774934492e-05, "loss": 0.5031, "step": 1971 }, { "epoch": 0.36, "learning_rate": 1.9563294102753892e-05, "loss": 0.4902, "step": 1972 }, { "epoch": 0.37, "learning_rate": 1.9562710074605133e-05, "loss": 0.494, "step": 1973 }, { "epoch": 0.37, "learning_rate": 1.956212566492195e-05, "loss": 0.5161, "step": 1974 }, { "epoch": 0.37, "learning_rate": 1.9561540873727653e-05, "loss": 0.4996, "step": 1975 }, { "epoch": 0.37, "learning_rate": 1.956095570104558e-05, "loss": 0.4917, "step": 1976 }, { "epoch": 0.37, "learning_rate": 1.9560370146899075e-05, "loss": 0.5113, "step": 1977 }, { "epoch": 0.37, "learning_rate": 1.95597842113115e-05, "loss": 0.4912, "step": 1978 }, { "epoch": 0.37, "learning_rate": 1.9559197894306238e-05, "loss": 0.4794, "step": 1979 }, { "epoch": 0.37, "learning_rate": 1.955861119590668e-05, "loss": 0.4831, "step": 1980 }, { "epoch": 0.37, "learning_rate": 1.9558024116136227e-05, "loss": 0.4584, "step": 1981 }, { "epoch": 0.37, "learning_rate": 1.9557436655018312e-05, "loss": 0.5043, "step": 1982 }, { "epoch": 0.37, "learning_rate": 1.955684881257637e-05, "loss": 0.4991, "step": 1983 }, { "epoch": 0.37, "learning_rate": 1.955626058883385e-05, "loss": 0.5124, "step": 1984 }, { "epoch": 0.37, "learning_rate": 1.955567198381423e-05, "loss": 0.5129, "step": 1985 }, { "epoch": 0.37, "learning_rate": 1.9555082997540987e-05, "loss": 0.4991, "step": 1986 }, { "epoch": 0.37, "learning_rate": 1.9554493630037626e-05, "loss": 0.4913, "step": 1987 }, { "epoch": 0.37, "learning_rate": 1.9553903881327655e-05, "loss": 0.4866, "step": 1988 }, { "epoch": 0.37, "learning_rate": 1.955331375143461e-05, "loss": 0.5041, "step": 1989 }, { "epoch": 0.37, "learning_rate": 1.9552723240382034e-05, "loss": 0.4831, "step": 1990 }, { "epoch": 0.37, "learning_rate": 1.9552132348193486e-05, "loss": 0.4971, "step": 1991 }, { "epoch": 0.37, "learning_rate": 1.9551541074892545e-05, "loss": 0.4974, "step": 1992 }, { "epoch": 0.37, "learning_rate": 1.9550949420502795e-05, "loss": 0.4853, "step": 1993 }, { "epoch": 0.37, "learning_rate": 1.955035738504785e-05, "loss": 0.4996, "step": 1994 }, { "epoch": 0.37, "learning_rate": 1.9549764968551325e-05, "loss": 0.5089, "step": 1995 }, { "epoch": 0.37, "learning_rate": 1.9549172171036863e-05, "loss": 0.4663, "step": 1996 }, { "epoch": 0.37, "learning_rate": 1.9548578992528106e-05, "loss": 0.5038, "step": 1997 }, { "epoch": 0.37, "learning_rate": 1.954798543304873e-05, "loss": 0.5017, "step": 1998 }, { "epoch": 0.37, "learning_rate": 1.954739149262241e-05, "loss": 0.4916, "step": 1999 }, { "epoch": 0.37, "learning_rate": 1.9546797171272846e-05, "loss": 0.4938, "step": 2000 }, { "epoch": 0.37, "learning_rate": 1.954620246902375e-05, "loss": 0.4918, "step": 2001 }, { "epoch": 0.37, "learning_rate": 1.9545607385898853e-05, "loss": 0.4972, "step": 2002 }, { "epoch": 0.37, "learning_rate": 1.954501192192189e-05, "loss": 0.4675, "step": 2003 }, { "epoch": 0.37, "learning_rate": 1.9544416077116626e-05, "loss": 0.4737, "step": 2004 }, { "epoch": 0.37, "learning_rate": 1.9543819851506832e-05, "loss": 0.4905, "step": 2005 }, { "epoch": 0.37, "learning_rate": 1.9543223245116297e-05, "loss": 0.4991, "step": 2006 }, { "epoch": 0.37, "learning_rate": 1.954262625796882e-05, "loss": 0.4913, "step": 2007 }, { "epoch": 0.37, "learning_rate": 1.954202889008823e-05, "loss": 0.4744, "step": 2008 }, { "epoch": 0.37, "learning_rate": 1.9541431141498345e-05, "loss": 0.5128, "step": 2009 }, { "epoch": 0.37, "learning_rate": 1.9540833012223026e-05, "loss": 0.5022, "step": 2010 }, { "epoch": 0.37, "learning_rate": 1.9540234502286136e-05, "loss": 0.4684, "step": 2011 }, { "epoch": 0.37, "learning_rate": 1.953963561171155e-05, "loss": 0.5126, "step": 2012 }, { "epoch": 0.37, "learning_rate": 1.9539036340523165e-05, "loss": 0.4927, "step": 2013 }, { "epoch": 0.37, "learning_rate": 1.9538436688744893e-05, "loss": 0.4951, "step": 2014 }, { "epoch": 0.37, "learning_rate": 1.9537836656400657e-05, "loss": 0.4989, "step": 2015 }, { "epoch": 0.37, "learning_rate": 1.9537236243514398e-05, "loss": 0.4922, "step": 2016 }, { "epoch": 0.37, "learning_rate": 1.953663545011007e-05, "loss": 0.504, "step": 2017 }, { "epoch": 0.37, "learning_rate": 1.953603427621164e-05, "loss": 0.5138, "step": 2018 }, { "epoch": 0.37, "learning_rate": 1.95354327218431e-05, "loss": 0.4938, "step": 2019 }, { "epoch": 0.37, "learning_rate": 1.9534830787028452e-05, "loss": 0.4878, "step": 2020 }, { "epoch": 0.37, "learning_rate": 1.9534228471791707e-05, "loss": 0.492, "step": 2021 }, { "epoch": 0.37, "learning_rate": 1.95336257761569e-05, "loss": 0.4915, "step": 2022 }, { "epoch": 0.37, "learning_rate": 1.9533022700148074e-05, "loss": 0.49, "step": 2023 }, { "epoch": 0.37, "learning_rate": 1.953241924378929e-05, "loss": 0.4897, "step": 2024 }, { "epoch": 0.37, "learning_rate": 1.953181540710463e-05, "loss": 0.4981, "step": 2025 }, { "epoch": 0.37, "learning_rate": 1.9531211190118182e-05, "loss": 0.4625, "step": 2026 }, { "epoch": 0.38, "learning_rate": 1.9530606592854052e-05, "loss": 0.4814, "step": 2027 }, { "epoch": 0.38, "learning_rate": 1.953000161533637e-05, "loss": 0.4844, "step": 2028 }, { "epoch": 0.38, "learning_rate": 1.9529396257589264e-05, "loss": 0.4962, "step": 2029 }, { "epoch": 0.38, "learning_rate": 1.952879051963689e-05, "loss": 0.4815, "step": 2030 }, { "epoch": 0.38, "learning_rate": 1.952818440150342e-05, "loss": 0.483, "step": 2031 }, { "epoch": 0.38, "learning_rate": 1.9527577903213027e-05, "loss": 0.4792, "step": 2032 }, { "epoch": 0.38, "learning_rate": 1.952697102478992e-05, "loss": 0.4969, "step": 2033 }, { "epoch": 0.38, "learning_rate": 1.952636376625831e-05, "loss": 0.4914, "step": 2034 }, { "epoch": 0.38, "learning_rate": 1.9525756127642415e-05, "loss": 0.5207, "step": 2035 }, { "epoch": 0.38, "learning_rate": 1.9525148108966494e-05, "loss": 0.4945, "step": 2036 }, { "epoch": 0.38, "learning_rate": 1.9524539710254795e-05, "loss": 0.496, "step": 2037 }, { "epoch": 0.38, "learning_rate": 1.95239309315316e-05, "loss": 0.5026, "step": 2038 }, { "epoch": 0.38, "learning_rate": 1.952332177282119e-05, "loss": 0.5129, "step": 2039 }, { "epoch": 0.38, "learning_rate": 1.9522712234147877e-05, "loss": 0.4927, "step": 2040 }, { "epoch": 0.38, "learning_rate": 1.9522102315535974e-05, "loss": 0.4817, "step": 2041 }, { "epoch": 0.38, "learning_rate": 1.952149201700982e-05, "loss": 0.4941, "step": 2042 }, { "epoch": 0.38, "learning_rate": 1.952088133859376e-05, "loss": 0.4901, "step": 2043 }, { "epoch": 0.38, "learning_rate": 1.9520270280312162e-05, "loss": 0.4828, "step": 2044 }, { "epoch": 0.38, "learning_rate": 1.951965884218941e-05, "loss": 0.4934, "step": 2045 }, { "epoch": 0.38, "learning_rate": 1.9519047024249892e-05, "loss": 0.4852, "step": 2046 }, { "epoch": 0.38, "learning_rate": 1.9518434826518025e-05, "loss": 0.4892, "step": 2047 }, { "epoch": 0.38, "learning_rate": 1.951782224901823e-05, "loss": 0.4976, "step": 2048 }, { "epoch": 0.38, "learning_rate": 1.9517209291774947e-05, "loss": 0.4784, "step": 2049 }, { "epoch": 0.38, "learning_rate": 1.9516595954812637e-05, "loss": 0.4873, "step": 2050 }, { "epoch": 0.38, "learning_rate": 1.9515982238155766e-05, "loss": 0.4895, "step": 2051 }, { "epoch": 0.38, "learning_rate": 1.951536814182882e-05, "loss": 0.5028, "step": 2052 }, { "epoch": 0.38, "learning_rate": 1.9514753665856306e-05, "loss": 0.4922, "step": 2053 }, { "epoch": 0.38, "learning_rate": 1.9514138810262736e-05, "loss": 0.4973, "step": 2054 }, { "epoch": 0.38, "learning_rate": 1.9513523575072645e-05, "loss": 0.4875, "step": 2055 }, { "epoch": 0.38, "learning_rate": 1.9512907960310573e-05, "loss": 0.5078, "step": 2056 }, { "epoch": 0.38, "learning_rate": 1.9512291966001088e-05, "loss": 0.496, "step": 2057 }, { "epoch": 0.38, "learning_rate": 1.9511675592168763e-05, "loss": 0.4759, "step": 2058 }, { "epoch": 0.38, "learning_rate": 1.9511058838838194e-05, "loss": 0.5109, "step": 2059 }, { "epoch": 0.38, "learning_rate": 1.9510441706033987e-05, "loss": 0.4994, "step": 2060 }, { "epoch": 0.38, "learning_rate": 1.9509824193780762e-05, "loss": 0.4866, "step": 2061 }, { "epoch": 0.38, "learning_rate": 1.950920630210316e-05, "loss": 0.4701, "step": 2062 }, { "epoch": 0.38, "learning_rate": 1.9508588031025833e-05, "loss": 0.48, "step": 2063 }, { "epoch": 0.38, "learning_rate": 1.9507969380573447e-05, "loss": 0.4991, "step": 2064 }, { "epoch": 0.38, "learning_rate": 1.9507350350770688e-05, "loss": 0.4909, "step": 2065 }, { "epoch": 0.38, "learning_rate": 1.950673094164225e-05, "loss": 0.5186, "step": 2066 }, { "epoch": 0.38, "learning_rate": 1.950611115321285e-05, "loss": 0.4815, "step": 2067 }, { "epoch": 0.38, "learning_rate": 1.9505490985507216e-05, "loss": 0.4942, "step": 2068 }, { "epoch": 0.38, "learning_rate": 1.950487043855009e-05, "loss": 0.4984, "step": 2069 }, { "epoch": 0.38, "learning_rate": 1.9504249512366228e-05, "loss": 0.4874, "step": 2070 }, { "epoch": 0.38, "learning_rate": 1.9503628206980413e-05, "loss": 0.4828, "step": 2071 }, { "epoch": 0.38, "learning_rate": 1.9503006522417425e-05, "loss": 0.4772, "step": 2072 }, { "epoch": 0.38, "learning_rate": 1.950238445870207e-05, "loss": 0.4741, "step": 2073 }, { "epoch": 0.38, "learning_rate": 1.950176201585917e-05, "loss": 0.4911, "step": 2074 }, { "epoch": 0.38, "learning_rate": 1.9501139193913555e-05, "loss": 0.4947, "step": 2075 }, { "epoch": 0.38, "learning_rate": 1.950051599289008e-05, "loss": 0.4934, "step": 2076 }, { "epoch": 0.38, "learning_rate": 1.9499892412813607e-05, "loss": 0.495, "step": 2077 }, { "epoch": 0.38, "learning_rate": 1.9499268453709014e-05, "loss": 0.4829, "step": 2078 }, { "epoch": 0.38, "learning_rate": 1.9498644115601197e-05, "loss": 0.4764, "step": 2079 }, { "epoch": 0.38, "learning_rate": 1.9498019398515067e-05, "loss": 0.4841, "step": 2080 }, { "epoch": 0.39, "learning_rate": 1.9497394302475548e-05, "loss": 0.4919, "step": 2081 }, { "epoch": 0.39, "learning_rate": 1.949676882750758e-05, "loss": 0.5017, "step": 2082 }, { "epoch": 0.39, "learning_rate": 1.9496142973636115e-05, "loss": 0.4861, "step": 2083 }, { "epoch": 0.39, "learning_rate": 1.949551674088613e-05, "loss": 0.489, "step": 2084 }, { "epoch": 0.39, "learning_rate": 1.949489012928261e-05, "loss": 0.4857, "step": 2085 }, { "epoch": 0.39, "learning_rate": 1.949426313885055e-05, "loss": 0.5052, "step": 2086 }, { "epoch": 0.39, "learning_rate": 1.949363576961497e-05, "loss": 0.4849, "step": 2087 }, { "epoch": 0.39, "learning_rate": 1.9493008021600902e-05, "loss": 0.4972, "step": 2088 }, { "epoch": 0.39, "learning_rate": 1.9492379894833387e-05, "loss": 0.5074, "step": 2089 }, { "epoch": 0.39, "learning_rate": 1.949175138933749e-05, "loss": 0.4875, "step": 2090 }, { "epoch": 0.39, "learning_rate": 1.9491122505138283e-05, "loss": 0.5021, "step": 2091 }, { "epoch": 0.39, "learning_rate": 1.9490493242260862e-05, "loss": 0.4911, "step": 2092 }, { "epoch": 0.39, "learning_rate": 1.9489863600730335e-05, "loss": 0.4902, "step": 2093 }, { "epoch": 0.39, "learning_rate": 1.9489233580571815e-05, "loss": 0.4636, "step": 2094 }, { "epoch": 0.39, "learning_rate": 1.9488603181810452e-05, "loss": 0.4796, "step": 2095 }, { "epoch": 0.39, "learning_rate": 1.9487972404471382e-05, "loss": 0.4825, "step": 2096 }, { "epoch": 0.39, "learning_rate": 1.9487341248579783e-05, "loss": 0.472, "step": 2097 }, { "epoch": 0.39, "learning_rate": 1.9486709714160833e-05, "loss": 0.4906, "step": 2098 }, { "epoch": 0.39, "learning_rate": 1.9486077801239727e-05, "loss": 0.4751, "step": 2099 }, { "epoch": 0.39, "learning_rate": 1.9485445509841682e-05, "loss": 0.4875, "step": 2100 }, { "epoch": 0.39, "learning_rate": 1.9484812839991925e-05, "loss": 0.4918, "step": 2101 }, { "epoch": 0.39, "learning_rate": 1.9484179791715694e-05, "loss": 0.4915, "step": 2102 }, { "epoch": 0.39, "learning_rate": 1.9483546365038247e-05, "loss": 0.4894, "step": 2103 }, { "epoch": 0.39, "learning_rate": 1.9482912559984864e-05, "loss": 0.4772, "step": 2104 }, { "epoch": 0.39, "learning_rate": 1.9482278376580824e-05, "loss": 0.4771, "step": 2105 }, { "epoch": 0.39, "learning_rate": 1.948164381485143e-05, "loss": 0.5041, "step": 2106 }, { "epoch": 0.39, "learning_rate": 1.9481008874822005e-05, "loss": 0.4936, "step": 2107 }, { "epoch": 0.39, "learning_rate": 1.948037355651788e-05, "loss": 0.4964, "step": 2108 }, { "epoch": 0.39, "learning_rate": 1.9479737859964403e-05, "loss": 0.5076, "step": 2109 }, { "epoch": 0.39, "learning_rate": 1.9479101785186932e-05, "loss": 0.4886, "step": 2110 }, { "epoch": 0.39, "learning_rate": 1.9478465332210853e-05, "loss": 0.4902, "step": 2111 }, { "epoch": 0.39, "learning_rate": 1.947782850106156e-05, "loss": 0.4837, "step": 2112 }, { "epoch": 0.39, "learning_rate": 1.9477191291764452e-05, "loss": 0.4797, "step": 2113 }, { "epoch": 0.39, "learning_rate": 1.9476553704344962e-05, "loss": 0.4779, "step": 2114 }, { "epoch": 0.39, "learning_rate": 1.9475915738828522e-05, "loss": 0.4908, "step": 2115 }, { "epoch": 0.39, "learning_rate": 1.947527739524059e-05, "loss": 0.5109, "step": 2116 }, { "epoch": 0.39, "learning_rate": 1.947463867360663e-05, "loss": 0.5078, "step": 2117 }, { "epoch": 0.39, "learning_rate": 1.947399957395213e-05, "loss": 0.4856, "step": 2118 }, { "epoch": 0.39, "learning_rate": 1.947336009630259e-05, "loss": 0.483, "step": 2119 }, { "epoch": 0.39, "learning_rate": 1.947272024068352e-05, "loss": 0.4909, "step": 2120 }, { "epoch": 0.39, "learning_rate": 1.9472080007120452e-05, "loss": 0.4725, "step": 2121 }, { "epoch": 0.39, "learning_rate": 1.9471439395638927e-05, "loss": 0.4953, "step": 2122 }, { "epoch": 0.39, "learning_rate": 1.9470798406264504e-05, "loss": 0.5179, "step": 2123 }, { "epoch": 0.39, "learning_rate": 1.947015703902276e-05, "loss": 0.4923, "step": 2124 }, { "epoch": 0.39, "learning_rate": 1.9469515293939286e-05, "loss": 0.482, "step": 2125 }, { "epoch": 0.39, "learning_rate": 1.9468873171039685e-05, "loss": 0.4999, "step": 2126 }, { "epoch": 0.39, "learning_rate": 1.9468230670349575e-05, "loss": 0.5002, "step": 2127 }, { "epoch": 0.39, "learning_rate": 1.946758779189459e-05, "loss": 0.4639, "step": 2128 }, { "epoch": 0.39, "learning_rate": 1.9466944535700382e-05, "loss": 0.4625, "step": 2129 }, { "epoch": 0.39, "learning_rate": 1.946630090179261e-05, "loss": 0.4788, "step": 2130 }, { "epoch": 0.39, "learning_rate": 1.9465656890196966e-05, "loss": 0.4994, "step": 2131 }, { "epoch": 0.39, "learning_rate": 1.9465012500939134e-05, "loss": 0.4808, "step": 2132 }, { "epoch": 0.39, "learning_rate": 1.9464367734044823e-05, "loss": 0.4869, "step": 2133 }, { "epoch": 0.39, "learning_rate": 1.9463722589539768e-05, "loss": 0.4925, "step": 2134 }, { "epoch": 0.4, "learning_rate": 1.94630770674497e-05, "loss": 0.4827, "step": 2135 }, { "epoch": 0.4, "learning_rate": 1.946243116780038e-05, "loss": 0.4728, "step": 2136 }, { "epoch": 0.4, "learning_rate": 1.9461784890617573e-05, "loss": 0.4814, "step": 2137 }, { "epoch": 0.4, "learning_rate": 1.9461138235927068e-05, "loss": 0.4711, "step": 2138 }, { "epoch": 0.4, "learning_rate": 1.9460491203754666e-05, "loss": 0.4888, "step": 2139 }, { "epoch": 0.4, "learning_rate": 1.945984379412618e-05, "loss": 0.4987, "step": 2140 }, { "epoch": 0.4, "learning_rate": 1.9459196007067437e-05, "loss": 0.4947, "step": 2141 }, { "epoch": 0.4, "learning_rate": 1.945854784260429e-05, "loss": 0.4869, "step": 2142 }, { "epoch": 0.4, "learning_rate": 1.9457899300762598e-05, "loss": 0.4632, "step": 2143 }, { "epoch": 0.4, "learning_rate": 1.945725038156823e-05, "loss": 0.467, "step": 2144 }, { "epoch": 0.4, "learning_rate": 1.9456601085047084e-05, "loss": 0.4957, "step": 2145 }, { "epoch": 0.4, "learning_rate": 1.9455951411225064e-05, "loss": 0.4858, "step": 2146 }, { "epoch": 0.4, "learning_rate": 1.9455301360128088e-05, "loss": 0.489, "step": 2147 }, { "epoch": 0.4, "learning_rate": 1.9454650931782095e-05, "loss": 0.4997, "step": 2148 }, { "epoch": 0.4, "learning_rate": 1.9454000126213036e-05, "loss": 0.5, "step": 2149 }, { "epoch": 0.4, "learning_rate": 1.9453348943446872e-05, "loss": 0.4857, "step": 2150 }, { "epoch": 0.4, "learning_rate": 1.945269738350959e-05, "loss": 0.4988, "step": 2151 }, { "epoch": 0.4, "learning_rate": 1.9452045446427183e-05, "loss": 0.4924, "step": 2152 }, { "epoch": 0.4, "learning_rate": 1.9451393132225664e-05, "loss": 0.4677, "step": 2153 }, { "epoch": 0.4, "learning_rate": 1.9450740440931054e-05, "loss": 0.4876, "step": 2154 }, { "epoch": 0.4, "learning_rate": 1.9450087372569403e-05, "loss": 0.4943, "step": 2155 }, { "epoch": 0.4, "learning_rate": 1.9449433927166758e-05, "loss": 0.476, "step": 2156 }, { "epoch": 0.4, "learning_rate": 1.9448780104749198e-05, "loss": 0.4985, "step": 2157 }, { "epoch": 0.4, "learning_rate": 1.94481259053428e-05, "loss": 0.4817, "step": 2158 }, { "epoch": 0.4, "learning_rate": 1.944747132897368e-05, "loss": 0.4906, "step": 2159 }, { "epoch": 0.4, "learning_rate": 1.9446816375667937e-05, "loss": 0.4893, "step": 2160 }, { "epoch": 0.4, "learning_rate": 1.9446161045451714e-05, "loss": 0.5074, "step": 2161 }, { "epoch": 0.4, "learning_rate": 1.9445505338351155e-05, "loss": 0.4583, "step": 2162 }, { "epoch": 0.4, "learning_rate": 1.9444849254392422e-05, "loss": 0.4924, "step": 2163 }, { "epoch": 0.4, "learning_rate": 1.944419279360169e-05, "loss": 0.4898, "step": 2164 }, { "epoch": 0.4, "learning_rate": 1.944353595600515e-05, "loss": 0.4855, "step": 2165 }, { "epoch": 0.4, "learning_rate": 1.944287874162901e-05, "loss": 0.4915, "step": 2166 }, { "epoch": 0.4, "learning_rate": 1.9442221150499492e-05, "loss": 0.4997, "step": 2167 }, { "epoch": 0.4, "learning_rate": 1.944156318264283e-05, "loss": 0.4859, "step": 2168 }, { "epoch": 0.4, "learning_rate": 1.9440904838085277e-05, "loss": 0.4981, "step": 2169 }, { "epoch": 0.4, "learning_rate": 1.9440246116853104e-05, "loss": 0.4842, "step": 2170 }, { "epoch": 0.4, "learning_rate": 1.9439587018972586e-05, "loss": 0.5079, "step": 2171 }, { "epoch": 0.4, "learning_rate": 1.9438927544470022e-05, "loss": 0.4766, "step": 2172 }, { "epoch": 0.4, "learning_rate": 1.9438267693371728e-05, "loss": 0.482, "step": 2173 }, { "epoch": 0.4, "learning_rate": 1.9437607465704028e-05, "loss": 0.4867, "step": 2174 }, { "epoch": 0.4, "learning_rate": 1.943694686149326e-05, "loss": 0.5061, "step": 2175 }, { "epoch": 0.4, "learning_rate": 1.9436285880765785e-05, "loss": 0.4813, "step": 2176 }, { "epoch": 0.4, "learning_rate": 1.9435624523547974e-05, "loss": 0.4929, "step": 2177 }, { "epoch": 0.4, "learning_rate": 1.9434962789866215e-05, "loss": 0.4877, "step": 2178 }, { "epoch": 0.4, "learning_rate": 1.943430067974691e-05, "loss": 0.4751, "step": 2179 }, { "epoch": 0.4, "learning_rate": 1.9433638193216473e-05, "loss": 0.5022, "step": 2180 }, { "epoch": 0.4, "learning_rate": 1.9432975330301338e-05, "loss": 0.483, "step": 2181 }, { "epoch": 0.4, "learning_rate": 1.9432312091027957e-05, "loss": 0.4847, "step": 2182 }, { "epoch": 0.4, "learning_rate": 1.943164847542278e-05, "loss": 0.4993, "step": 2183 }, { "epoch": 0.4, "learning_rate": 1.9430984483512295e-05, "loss": 0.4867, "step": 2184 }, { "epoch": 0.4, "learning_rate": 1.9430320115322988e-05, "loss": 0.4878, "step": 2185 }, { "epoch": 0.4, "learning_rate": 1.942965537088137e-05, "loss": 0.4792, "step": 2186 }, { "epoch": 0.4, "learning_rate": 1.942899025021396e-05, "loss": 0.4944, "step": 2187 }, { "epoch": 0.4, "learning_rate": 1.94283247533473e-05, "loss": 0.4776, "step": 2188 }, { "epoch": 0.4, "learning_rate": 1.9427658880307934e-05, "loss": 0.4811, "step": 2189 }, { "epoch": 0.41, "learning_rate": 1.9426992631122433e-05, "loss": 0.465, "step": 2190 }, { "epoch": 0.41, "learning_rate": 1.9426326005817383e-05, "loss": 0.4785, "step": 2191 }, { "epoch": 0.41, "learning_rate": 1.9425659004419378e-05, "loss": 0.4895, "step": 2192 }, { "epoch": 0.41, "learning_rate": 1.9424991626955027e-05, "loss": 0.4576, "step": 2193 }, { "epoch": 0.41, "learning_rate": 1.942432387345096e-05, "loss": 0.4967, "step": 2194 }, { "epoch": 0.41, "learning_rate": 1.942365574393382e-05, "loss": 0.5003, "step": 2195 }, { "epoch": 0.41, "learning_rate": 1.9422987238430266e-05, "loss": 0.4965, "step": 2196 }, { "epoch": 0.41, "learning_rate": 1.9422318356966967e-05, "loss": 0.4849, "step": 2197 }, { "epoch": 0.41, "learning_rate": 1.9421649099570605e-05, "loss": 0.5038, "step": 2198 }, { "epoch": 0.41, "learning_rate": 1.9420979466267892e-05, "loss": 0.4929, "step": 2199 }, { "epoch": 0.41, "learning_rate": 1.9420309457085537e-05, "loss": 0.5023, "step": 2200 }, { "epoch": 0.41, "learning_rate": 1.941963907205028e-05, "loss": 0.4939, "step": 2201 }, { "epoch": 0.41, "learning_rate": 1.941896831118886e-05, "loss": 0.5061, "step": 2202 }, { "epoch": 0.41, "learning_rate": 1.941829717452805e-05, "loss": 0.4631, "step": 2203 }, { "epoch": 0.41, "learning_rate": 1.9417625662094613e-05, "loss": 0.4878, "step": 2204 }, { "epoch": 0.41, "learning_rate": 1.941695377391535e-05, "loss": 0.4771, "step": 2205 }, { "epoch": 0.41, "learning_rate": 1.941628151001707e-05, "loss": 0.4783, "step": 2206 }, { "epoch": 0.41, "learning_rate": 1.941560887042659e-05, "loss": 0.4738, "step": 2207 }, { "epoch": 0.41, "learning_rate": 1.941493585517075e-05, "loss": 0.487, "step": 2208 }, { "epoch": 0.41, "learning_rate": 1.9414262464276398e-05, "loss": 0.4733, "step": 2209 }, { "epoch": 0.41, "learning_rate": 1.9413588697770404e-05, "loss": 0.4865, "step": 2210 }, { "epoch": 0.41, "learning_rate": 1.9412914555679648e-05, "loss": 0.4864, "step": 2211 }, { "epoch": 0.41, "learning_rate": 1.9412240038031034e-05, "loss": 0.485, "step": 2212 }, { "epoch": 0.41, "learning_rate": 1.9411565144851467e-05, "loss": 0.5155, "step": 2213 }, { "epoch": 0.41, "learning_rate": 1.9410889876167873e-05, "loss": 0.5143, "step": 2214 }, { "epoch": 0.41, "learning_rate": 1.9410214232007197e-05, "loss": 0.4649, "step": 2215 }, { "epoch": 0.41, "learning_rate": 1.94095382123964e-05, "loss": 0.4917, "step": 2216 }, { "epoch": 0.41, "learning_rate": 1.9408861817362443e-05, "loss": 0.5023, "step": 2217 }, { "epoch": 0.41, "learning_rate": 1.9408185046932324e-05, "loss": 0.4801, "step": 2218 }, { "epoch": 0.41, "learning_rate": 1.940750790113304e-05, "loss": 0.4936, "step": 2219 }, { "epoch": 0.41, "learning_rate": 1.940683037999161e-05, "loss": 0.496, "step": 2220 }, { "epoch": 0.41, "learning_rate": 1.9406152483535063e-05, "loss": 0.486, "step": 2221 }, { "epoch": 0.41, "learning_rate": 1.9405474211790442e-05, "loss": 0.4952, "step": 2222 }, { "epoch": 0.41, "learning_rate": 1.940479556478482e-05, "loss": 0.496, "step": 2223 }, { "epoch": 0.41, "learning_rate": 1.9404116542545263e-05, "loss": 0.474, "step": 2224 }, { "epoch": 0.41, "learning_rate": 1.9403437145098867e-05, "loss": 0.4708, "step": 2225 }, { "epoch": 0.41, "learning_rate": 1.9402757372472746e-05, "loss": 0.4898, "step": 2226 }, { "epoch": 0.41, "learning_rate": 1.9402077224694008e-05, "loss": 0.5021, "step": 2227 }, { "epoch": 0.41, "learning_rate": 1.9401396701789798e-05, "loss": 0.4934, "step": 2228 }, { "epoch": 0.41, "learning_rate": 1.9400715803787267e-05, "loss": 0.4977, "step": 2229 }, { "epoch": 0.41, "learning_rate": 1.940003453071358e-05, "loss": 0.4791, "step": 2230 }, { "epoch": 0.41, "learning_rate": 1.9399352882595915e-05, "loss": 0.4755, "step": 2231 }, { "epoch": 0.41, "learning_rate": 1.9398670859461478e-05, "loss": 0.4869, "step": 2232 }, { "epoch": 0.41, "learning_rate": 1.939798846133747e-05, "loss": 0.4813, "step": 2233 }, { "epoch": 0.41, "learning_rate": 1.9397305688251124e-05, "loss": 0.5072, "step": 2234 }, { "epoch": 0.41, "learning_rate": 1.9396622540229682e-05, "loss": 0.4866, "step": 2235 }, { "epoch": 0.41, "learning_rate": 1.9395939017300396e-05, "loss": 0.4879, "step": 2236 }, { "epoch": 0.41, "learning_rate": 1.9395255119490542e-05, "loss": 0.499, "step": 2237 }, { "epoch": 0.41, "learning_rate": 1.93945708468274e-05, "loss": 0.4725, "step": 2238 }, { "epoch": 0.41, "learning_rate": 1.9393886199338277e-05, "loss": 0.4726, "step": 2239 }, { "epoch": 0.41, "learning_rate": 1.9393201177050484e-05, "loss": 0.4788, "step": 2240 }, { "epoch": 0.41, "learning_rate": 1.939251577999136e-05, "loss": 0.4817, "step": 2241 }, { "epoch": 0.41, "learning_rate": 1.9391830008188242e-05, "loss": 0.5051, "step": 2242 }, { "epoch": 0.41, "learning_rate": 1.9391143861668497e-05, "loss": 0.4878, "step": 2243 }, { "epoch": 0.42, "learning_rate": 1.93904573404595e-05, "loss": 0.5, "step": 2244 }, { "epoch": 0.42, "learning_rate": 1.9389770444588637e-05, "loss": 0.4919, "step": 2245 }, { "epoch": 0.42, "learning_rate": 1.9389083174083323e-05, "loss": 0.4641, "step": 2246 }, { "epoch": 0.42, "learning_rate": 1.938839552897097e-05, "loss": 0.4837, "step": 2247 }, { "epoch": 0.42, "learning_rate": 1.938770750927902e-05, "loss": 0.4888, "step": 2248 }, { "epoch": 0.42, "learning_rate": 1.938701911503492e-05, "loss": 0.485, "step": 2249 }, { "epoch": 0.42, "learning_rate": 1.9386330346266137e-05, "loss": 0.4731, "step": 2250 }, { "epoch": 0.42, "learning_rate": 1.938564120300015e-05, "loss": 0.4733, "step": 2251 }, { "epoch": 0.42, "learning_rate": 1.9384951685264458e-05, "loss": 0.4844, "step": 2252 }, { "epoch": 0.42, "learning_rate": 1.938426179308657e-05, "loss": 0.497, "step": 2253 }, { "epoch": 0.42, "learning_rate": 1.9383571526494012e-05, "loss": 0.5062, "step": 2254 }, { "epoch": 0.42, "learning_rate": 1.938288088551432e-05, "loss": 0.4782, "step": 2255 }, { "epoch": 0.42, "learning_rate": 1.9382189870175055e-05, "loss": 0.4969, "step": 2256 }, { "epoch": 0.42, "learning_rate": 1.9381498480503785e-05, "loss": 0.4993, "step": 2257 }, { "epoch": 0.42, "learning_rate": 1.9380806716528093e-05, "loss": 0.4852, "step": 2258 }, { "epoch": 0.42, "learning_rate": 1.9380114578275582e-05, "loss": 0.4823, "step": 2259 }, { "epoch": 0.42, "learning_rate": 1.9379422065773866e-05, "loss": 0.4916, "step": 2260 }, { "epoch": 0.42, "learning_rate": 1.9378729179050575e-05, "loss": 0.5057, "step": 2261 }, { "epoch": 0.42, "learning_rate": 1.9378035918133356e-05, "loss": 0.4716, "step": 2262 }, { "epoch": 0.42, "learning_rate": 1.9377342283049866e-05, "loss": 0.4693, "step": 2263 }, { "epoch": 0.42, "learning_rate": 1.937664827382778e-05, "loss": 0.4992, "step": 2264 }, { "epoch": 0.42, "learning_rate": 1.9375953890494787e-05, "loss": 0.497, "step": 2265 }, { "epoch": 0.42, "learning_rate": 1.9375259133078595e-05, "loss": 0.4917, "step": 2266 }, { "epoch": 0.42, "learning_rate": 1.937456400160692e-05, "loss": 0.4864, "step": 2267 }, { "epoch": 0.42, "learning_rate": 1.93738684961075e-05, "loss": 0.4896, "step": 2268 }, { "epoch": 0.42, "learning_rate": 1.937317261660808e-05, "loss": 0.4705, "step": 2269 }, { "epoch": 0.42, "learning_rate": 1.9372476363136427e-05, "loss": 0.4871, "step": 2270 }, { "epoch": 0.42, "learning_rate": 1.9371779735720318e-05, "loss": 0.4705, "step": 2271 }, { "epoch": 0.42, "learning_rate": 1.9371082734387552e-05, "loss": 0.5038, "step": 2272 }, { "epoch": 0.42, "learning_rate": 1.9370385359165933e-05, "loss": 0.4852, "step": 2273 }, { "epoch": 0.42, "learning_rate": 1.9369687610083286e-05, "loss": 0.4837, "step": 2274 }, { "epoch": 0.42, "learning_rate": 1.9368989487167456e-05, "loss": 0.4776, "step": 2275 }, { "epoch": 0.42, "learning_rate": 1.936829099044629e-05, "loss": 0.4751, "step": 2276 }, { "epoch": 0.42, "learning_rate": 1.9367592119947653e-05, "loss": 0.4723, "step": 2277 }, { "epoch": 0.42, "learning_rate": 1.936689287569944e-05, "loss": 0.5085, "step": 2278 }, { "epoch": 0.42, "learning_rate": 1.936619325772954e-05, "loss": 0.4979, "step": 2279 }, { "epoch": 0.42, "learning_rate": 1.936549326606587e-05, "loss": 0.4913, "step": 2280 }, { "epoch": 0.42, "learning_rate": 1.9364792900736364e-05, "loss": 0.4918, "step": 2281 }, { "epoch": 0.42, "learning_rate": 1.9364092161768956e-05, "loss": 0.4962, "step": 2282 }, { "epoch": 0.42, "learning_rate": 1.9363391049191605e-05, "loss": 0.4852, "step": 2283 }, { "epoch": 0.42, "learning_rate": 1.936268956303229e-05, "loss": 0.4789, "step": 2284 }, { "epoch": 0.42, "learning_rate": 1.9361987703318995e-05, "loss": 0.4769, "step": 2285 }, { "epoch": 0.42, "learning_rate": 1.9361285470079724e-05, "loss": 0.4754, "step": 2286 }, { "epoch": 0.42, "learning_rate": 1.9360582863342495e-05, "loss": 0.4889, "step": 2287 }, { "epoch": 0.42, "learning_rate": 1.935987988313534e-05, "loss": 0.4782, "step": 2288 }, { "epoch": 0.42, "learning_rate": 1.935917652948631e-05, "loss": 0.4805, "step": 2289 }, { "epoch": 0.42, "learning_rate": 1.9358472802423464e-05, "loss": 0.4911, "step": 2290 }, { "epoch": 0.42, "learning_rate": 1.9357768701974878e-05, "loss": 0.4702, "step": 2291 }, { "epoch": 0.42, "learning_rate": 1.9357064228168646e-05, "loss": 0.492, "step": 2292 }, { "epoch": 0.42, "learning_rate": 1.9356359381032873e-05, "loss": 0.48, "step": 2293 }, { "epoch": 0.42, "learning_rate": 1.9355654160595688e-05, "loss": 0.4641, "step": 2294 }, { "epoch": 0.42, "learning_rate": 1.935494856688522e-05, "loss": 0.4941, "step": 2295 }, { "epoch": 0.42, "learning_rate": 1.9354242599929628e-05, "loss": 0.4878, "step": 2296 }, { "epoch": 0.42, "learning_rate": 1.9353536259757072e-05, "loss": 0.4861, "step": 2297 }, { "epoch": 0.43, "learning_rate": 1.9352829546395738e-05, "loss": 0.4609, "step": 2298 }, { "epoch": 0.43, "learning_rate": 1.9352122459873822e-05, "loss": 0.4933, "step": 2299 }, { "epoch": 0.43, "learning_rate": 1.9351415000219534e-05, "loss": 0.4786, "step": 2300 }, { "epoch": 0.43, "learning_rate": 1.9350707167461104e-05, "loss": 0.4952, "step": 2301 }, { "epoch": 0.43, "learning_rate": 1.9349998961626765e-05, "loss": 0.4808, "step": 2302 }, { "epoch": 0.43, "learning_rate": 1.9349290382744784e-05, "loss": 0.5047, "step": 2303 }, { "epoch": 0.43, "learning_rate": 1.9348581430843425e-05, "loss": 0.4677, "step": 2304 }, { "epoch": 0.43, "learning_rate": 1.9347872105950972e-05, "loss": 0.4999, "step": 2305 }, { "epoch": 0.43, "learning_rate": 1.9347162408095733e-05, "loss": 0.4904, "step": 2306 }, { "epoch": 0.43, "learning_rate": 1.934645233730602e-05, "loss": 0.482, "step": 2307 }, { "epoch": 0.43, "learning_rate": 1.934574189361016e-05, "loss": 0.4859, "step": 2308 }, { "epoch": 0.43, "learning_rate": 1.93450310770365e-05, "loss": 0.4815, "step": 2309 }, { "epoch": 0.43, "learning_rate": 1.9344319887613407e-05, "loss": 0.4955, "step": 2310 }, { "epoch": 0.43, "learning_rate": 1.934360832536925e-05, "loss": 0.4628, "step": 2311 }, { "epoch": 0.43, "learning_rate": 1.9342896390332416e-05, "loss": 0.4782, "step": 2312 }, { "epoch": 0.43, "learning_rate": 1.9342184082531318e-05, "loss": 0.4821, "step": 2313 }, { "epoch": 0.43, "learning_rate": 1.934147140199437e-05, "loss": 0.4785, "step": 2314 }, { "epoch": 0.43, "learning_rate": 1.9340758348750012e-05, "loss": 0.4866, "step": 2315 }, { "epoch": 0.43, "learning_rate": 1.9340044922826683e-05, "loss": 0.4971, "step": 2316 }, { "epoch": 0.43, "learning_rate": 1.933933112425286e-05, "loss": 0.4819, "step": 2317 }, { "epoch": 0.43, "learning_rate": 1.9338616953057015e-05, "loss": 0.4654, "step": 2318 }, { "epoch": 0.43, "learning_rate": 1.933790240926764e-05, "loss": 0.4685, "step": 2319 }, { "epoch": 0.43, "learning_rate": 1.9337187492913256e-05, "loss": 0.4975, "step": 2320 }, { "epoch": 0.43, "learning_rate": 1.9336472204022373e-05, "loss": 0.4812, "step": 2321 }, { "epoch": 0.43, "learning_rate": 1.933575654262353e-05, "loss": 0.4998, "step": 2322 }, { "epoch": 0.43, "learning_rate": 1.9335040508745294e-05, "loss": 0.4795, "step": 2323 }, { "epoch": 0.43, "learning_rate": 1.933432410241622e-05, "loss": 0.4829, "step": 2324 }, { "epoch": 0.43, "learning_rate": 1.93336073236649e-05, "loss": 0.4906, "step": 2325 }, { "epoch": 0.43, "learning_rate": 1.9332890172519925e-05, "loss": 0.4655, "step": 2326 }, { "epoch": 0.43, "learning_rate": 1.9332172649009913e-05, "loss": 0.5041, "step": 2327 }, { "epoch": 0.43, "learning_rate": 1.9331454753163493e-05, "loss": 0.4913, "step": 2328 }, { "epoch": 0.43, "learning_rate": 1.9330736485009303e-05, "loss": 0.4867, "step": 2329 }, { "epoch": 0.43, "learning_rate": 1.9330017844576e-05, "loss": 0.5001, "step": 2330 }, { "epoch": 0.43, "learning_rate": 1.932929883189226e-05, "loss": 0.4772, "step": 2331 }, { "epoch": 0.43, "learning_rate": 1.932857944698677e-05, "loss": 0.4904, "step": 2332 }, { "epoch": 0.43, "learning_rate": 1.9327859689888237e-05, "loss": 0.4912, "step": 2333 }, { "epoch": 0.43, "learning_rate": 1.9327139560625365e-05, "loss": 0.4907, "step": 2334 }, { "epoch": 0.43, "learning_rate": 1.9326419059226896e-05, "loss": 0.4922, "step": 2335 }, { "epoch": 0.43, "learning_rate": 1.9325698185721574e-05, "loss": 0.4876, "step": 2336 }, { "epoch": 0.43, "learning_rate": 1.932497694013816e-05, "loss": 0.4758, "step": 2337 }, { "epoch": 0.43, "learning_rate": 1.932425532250543e-05, "loss": 0.4998, "step": 2338 }, { "epoch": 0.43, "learning_rate": 1.9323533332852177e-05, "loss": 0.4857, "step": 2339 }, { "epoch": 0.43, "learning_rate": 1.9322810971207206e-05, "loss": 0.4873, "step": 2340 }, { "epoch": 0.43, "learning_rate": 1.9322088237599338e-05, "loss": 0.509, "step": 2341 }, { "epoch": 0.43, "learning_rate": 1.932136513205741e-05, "loss": 0.4974, "step": 2342 }, { "epoch": 0.43, "learning_rate": 1.932064165461027e-05, "loss": 0.4814, "step": 2343 }, { "epoch": 0.43, "learning_rate": 1.9319917805286784e-05, "loss": 0.4729, "step": 2344 }, { "epoch": 0.43, "learning_rate": 1.9319193584115835e-05, "loss": 0.5017, "step": 2345 }, { "epoch": 0.43, "learning_rate": 1.9318468991126313e-05, "loss": 0.4687, "step": 2346 }, { "epoch": 0.43, "learning_rate": 1.9317744026347133e-05, "loss": 0.4786, "step": 2347 }, { "epoch": 0.43, "learning_rate": 1.9317018689807218e-05, "loss": 0.4733, "step": 2348 }, { "epoch": 0.43, "learning_rate": 1.9316292981535506e-05, "loss": 0.4789, "step": 2349 }, { "epoch": 0.43, "learning_rate": 1.9315566901560953e-05, "loss": 0.4934, "step": 2350 }, { "epoch": 0.43, "learning_rate": 1.9314840449912527e-05, "loss": 0.4855, "step": 2351 }, { "epoch": 0.44, "learning_rate": 1.9314113626619217e-05, "loss": 0.4592, "step": 2352 }, { "epoch": 0.44, "learning_rate": 1.9313386431710015e-05, "loss": 0.4754, "step": 2353 }, { "epoch": 0.44, "learning_rate": 1.9312658865213938e-05, "loss": 0.4904, "step": 2354 }, { "epoch": 0.44, "learning_rate": 1.9311930927160014e-05, "loss": 0.4805, "step": 2355 }, { "epoch": 0.44, "learning_rate": 1.9311202617577286e-05, "loss": 0.4698, "step": 2356 }, { "epoch": 0.44, "learning_rate": 1.9310473936494812e-05, "loss": 0.4897, "step": 2357 }, { "epoch": 0.44, "learning_rate": 1.930974488394167e-05, "loss": 0.4967, "step": 2358 }, { "epoch": 0.44, "learning_rate": 1.930901545994694e-05, "loss": 0.4947, "step": 2359 }, { "epoch": 0.44, "learning_rate": 1.930828566453973e-05, "loss": 0.4752, "step": 2360 }, { "epoch": 0.44, "learning_rate": 1.9307555497749155e-05, "loss": 0.4854, "step": 2361 }, { "epoch": 0.44, "learning_rate": 1.9306824959604346e-05, "loss": 0.4827, "step": 2362 }, { "epoch": 0.44, "learning_rate": 1.9306094050134455e-05, "loss": 0.4858, "step": 2363 }, { "epoch": 0.44, "learning_rate": 1.9305362769368645e-05, "loss": 0.4831, "step": 2364 }, { "epoch": 0.44, "learning_rate": 1.9304631117336082e-05, "loss": 0.4785, "step": 2365 }, { "epoch": 0.44, "learning_rate": 1.9303899094065967e-05, "loss": 0.4535, "step": 2366 }, { "epoch": 0.44, "learning_rate": 1.9303166699587502e-05, "loss": 0.4878, "step": 2367 }, { "epoch": 0.44, "learning_rate": 1.9302433933929915e-05, "loss": 0.5002, "step": 2368 }, { "epoch": 0.44, "learning_rate": 1.930170079712243e-05, "loss": 0.5173, "step": 2369 }, { "epoch": 0.44, "learning_rate": 1.930096728919431e-05, "loss": 0.4845, "step": 2370 }, { "epoch": 0.44, "learning_rate": 1.9300233410174816e-05, "loss": 0.4658, "step": 2371 }, { "epoch": 0.44, "learning_rate": 1.9299499160093226e-05, "loss": 0.4839, "step": 2372 }, { "epoch": 0.44, "learning_rate": 1.9298764538978835e-05, "loss": 0.4887, "step": 2373 }, { "epoch": 0.44, "learning_rate": 1.929802954686096e-05, "loss": 0.5001, "step": 2374 }, { "epoch": 0.44, "learning_rate": 1.9297294183768917e-05, "loss": 0.4835, "step": 2375 }, { "epoch": 0.44, "learning_rate": 1.929655844973205e-05, "loss": 0.4913, "step": 2376 }, { "epoch": 0.44, "learning_rate": 1.9295822344779712e-05, "loss": 0.4964, "step": 2377 }, { "epoch": 0.44, "learning_rate": 1.9295085868941278e-05, "loss": 0.489, "step": 2378 }, { "epoch": 0.44, "learning_rate": 1.9294349022246124e-05, "loss": 0.4818, "step": 2379 }, { "epoch": 0.44, "learning_rate": 1.9293611804723653e-05, "loss": 0.491, "step": 2380 }, { "epoch": 0.44, "learning_rate": 1.9292874216403276e-05, "loss": 0.4813, "step": 2381 }, { "epoch": 0.44, "learning_rate": 1.9292136257314423e-05, "loss": 0.4763, "step": 2382 }, { "epoch": 0.44, "learning_rate": 1.929139792748654e-05, "loss": 0.5018, "step": 2383 }, { "epoch": 0.44, "learning_rate": 1.9290659226949077e-05, "loss": 0.4787, "step": 2384 }, { "epoch": 0.44, "learning_rate": 1.9289920155731518e-05, "loss": 0.4859, "step": 2385 }, { "epoch": 0.44, "learning_rate": 1.9289180713863342e-05, "loss": 0.4835, "step": 2386 }, { "epoch": 0.44, "learning_rate": 1.9288440901374054e-05, "loss": 0.5003, "step": 2387 }, { "epoch": 0.44, "learning_rate": 1.928770071829317e-05, "loss": 0.496, "step": 2388 }, { "epoch": 0.44, "learning_rate": 1.9286960164650222e-05, "loss": 0.4847, "step": 2389 }, { "epoch": 0.44, "learning_rate": 1.928621924047476e-05, "loss": 0.4861, "step": 2390 }, { "epoch": 0.44, "learning_rate": 1.9285477945796346e-05, "loss": 0.4944, "step": 2391 }, { "epoch": 0.44, "learning_rate": 1.928473628064455e-05, "loss": 0.502, "step": 2392 }, { "epoch": 0.44, "learning_rate": 1.928399424504897e-05, "loss": 0.4796, "step": 2393 }, { "epoch": 0.44, "learning_rate": 1.9283251839039204e-05, "loss": 0.4863, "step": 2394 }, { "epoch": 0.44, "learning_rate": 1.9282509062644878e-05, "loss": 0.5001, "step": 2395 }, { "epoch": 0.44, "learning_rate": 1.9281765915895628e-05, "loss": 0.4586, "step": 2396 }, { "epoch": 0.44, "learning_rate": 1.9281022398821103e-05, "loss": 0.4916, "step": 2397 }, { "epoch": 0.44, "learning_rate": 1.928027851145097e-05, "loss": 0.4792, "step": 2398 }, { "epoch": 0.44, "learning_rate": 1.9279534253814904e-05, "loss": 0.4887, "step": 2399 }, { "epoch": 0.44, "learning_rate": 1.92787896259426e-05, "loss": 0.4765, "step": 2400 }, { "epoch": 0.44, "learning_rate": 1.927804462786377e-05, "loss": 0.4933, "step": 2401 }, { "epoch": 0.44, "learning_rate": 1.9277299259608137e-05, "loss": 0.4743, "step": 2402 }, { "epoch": 0.44, "learning_rate": 1.927655352120544e-05, "loss": 0.4729, "step": 2403 }, { "epoch": 0.44, "learning_rate": 1.9275807412685435e-05, "loss": 0.4696, "step": 2404 }, { "epoch": 0.44, "learning_rate": 1.9275060934077883e-05, "loss": 0.4947, "step": 2405 }, { "epoch": 0.45, "learning_rate": 1.9274314085412574e-05, "loss": 0.4817, "step": 2406 }, { "epoch": 0.45, "learning_rate": 1.9273566866719306e-05, "loss": 0.4858, "step": 2407 }, { "epoch": 0.45, "learning_rate": 1.927281927802789e-05, "loss": 0.4803, "step": 2408 }, { "epoch": 0.45, "learning_rate": 1.927207131936815e-05, "loss": 0.473, "step": 2409 }, { "epoch": 0.45, "learning_rate": 1.9271322990769935e-05, "loss": 0.4953, "step": 2410 }, { "epoch": 0.45, "learning_rate": 1.9270574292263094e-05, "loss": 0.4655, "step": 2411 }, { "epoch": 0.45, "learning_rate": 1.9269825223877504e-05, "loss": 0.4733, "step": 2412 }, { "epoch": 0.45, "learning_rate": 1.9269075785643052e-05, "loss": 0.4912, "step": 2413 }, { "epoch": 0.45, "learning_rate": 1.9268325977589634e-05, "loss": 0.4882, "step": 2414 }, { "epoch": 0.45, "learning_rate": 1.9267575799747174e-05, "loss": 0.4848, "step": 2415 }, { "epoch": 0.45, "learning_rate": 1.9266825252145596e-05, "loss": 0.4712, "step": 2416 }, { "epoch": 0.45, "learning_rate": 1.9266074334814845e-05, "loss": 0.4861, "step": 2417 }, { "epoch": 0.45, "learning_rate": 1.926532304778489e-05, "loss": 0.4723, "step": 2418 }, { "epoch": 0.45, "learning_rate": 1.9264571391085692e-05, "loss": 0.467, "step": 2419 }, { "epoch": 0.45, "learning_rate": 1.9263819364747253e-05, "loss": 0.5061, "step": 2420 }, { "epoch": 0.45, "learning_rate": 1.926306696879957e-05, "loss": 0.4862, "step": 2421 }, { "epoch": 0.45, "learning_rate": 1.9262314203272666e-05, "loss": 0.489, "step": 2422 }, { "epoch": 0.45, "learning_rate": 1.9261561068196576e-05, "loss": 0.499, "step": 2423 }, { "epoch": 0.45, "learning_rate": 1.9260807563601343e-05, "loss": 0.5017, "step": 2424 }, { "epoch": 0.45, "learning_rate": 1.926005368951704e-05, "loss": 0.4912, "step": 2425 }, { "epoch": 0.45, "learning_rate": 1.9259299445973734e-05, "loss": 0.4741, "step": 2426 }, { "epoch": 0.45, "learning_rate": 1.9258544833001527e-05, "loss": 0.5075, "step": 2427 }, { "epoch": 0.45, "learning_rate": 1.925778985063052e-05, "loss": 0.4937, "step": 2428 }, { "epoch": 0.45, "learning_rate": 1.9257034498890837e-05, "loss": 0.5043, "step": 2429 }, { "epoch": 0.45, "learning_rate": 1.925627877781262e-05, "loss": 0.4765, "step": 2430 }, { "epoch": 0.45, "learning_rate": 1.925552268742602e-05, "loss": 0.5027, "step": 2431 }, { "epoch": 0.45, "learning_rate": 1.9254766227761194e-05, "loss": 0.482, "step": 2432 }, { "epoch": 0.45, "learning_rate": 1.9254009398848333e-05, "loss": 0.4936, "step": 2433 }, { "epoch": 0.45, "learning_rate": 1.9253252200717633e-05, "loss": 0.4881, "step": 2434 }, { "epoch": 0.45, "learning_rate": 1.9252494633399297e-05, "loss": 0.4918, "step": 2435 }, { "epoch": 0.45, "learning_rate": 1.925173669692356e-05, "loss": 0.4809, "step": 2436 }, { "epoch": 0.45, "learning_rate": 1.9250978391320655e-05, "loss": 0.5023, "step": 2437 }, { "epoch": 0.45, "learning_rate": 1.925021971662084e-05, "loss": 0.4813, "step": 2438 }, { "epoch": 0.45, "learning_rate": 1.9249460672854387e-05, "loss": 0.496, "step": 2439 }, { "epoch": 0.45, "learning_rate": 1.9248701260051577e-05, "loss": 0.4736, "step": 2440 }, { "epoch": 0.45, "learning_rate": 1.924794147824271e-05, "loss": 0.4914, "step": 2441 }, { "epoch": 0.45, "learning_rate": 1.92471813274581e-05, "loss": 0.4823, "step": 2442 }, { "epoch": 0.45, "learning_rate": 1.9246420807728078e-05, "loss": 0.4886, "step": 2443 }, { "epoch": 0.45, "learning_rate": 1.924565991908298e-05, "loss": 0.4774, "step": 2444 }, { "epoch": 0.45, "learning_rate": 1.9244898661553173e-05, "loss": 0.4785, "step": 2445 }, { "epoch": 0.45, "learning_rate": 1.9244137035169027e-05, "loss": 0.4744, "step": 2446 }, { "epoch": 0.45, "learning_rate": 1.9243375039960925e-05, "loss": 0.4811, "step": 2447 }, { "epoch": 0.45, "learning_rate": 1.9242612675959272e-05, "loss": 0.4987, "step": 2448 }, { "epoch": 0.45, "learning_rate": 1.924184994319449e-05, "loss": 0.4903, "step": 2449 }, { "epoch": 0.45, "learning_rate": 1.9241086841697002e-05, "loss": 0.4809, "step": 2450 }, { "epoch": 0.45, "learning_rate": 1.924032337149726e-05, "loss": 0.4649, "step": 2451 }, { "epoch": 0.45, "learning_rate": 1.9239559532625724e-05, "loss": 0.4624, "step": 2452 }, { "epoch": 0.45, "learning_rate": 1.9238795325112867e-05, "loss": 0.4757, "step": 2453 }, { "epoch": 0.45, "learning_rate": 1.923803074898919e-05, "loss": 0.4741, "step": 2454 }, { "epoch": 0.45, "learning_rate": 1.923726580428518e-05, "loss": 0.4706, "step": 2455 }, { "epoch": 0.45, "learning_rate": 1.923650049103137e-05, "loss": 0.4864, "step": 2456 }, { "epoch": 0.45, "learning_rate": 1.9235734809258292e-05, "loss": 0.5051, "step": 2457 }, { "epoch": 0.45, "learning_rate": 1.923496875899649e-05, "loss": 0.4852, "step": 2458 }, { "epoch": 0.45, "learning_rate": 1.923420234027654e-05, "loss": 0.4972, "step": 2459 }, { "epoch": 0.46, "learning_rate": 1.9233435553129008e-05, "loss": 0.4738, "step": 2460 }, { "epoch": 0.46, "learning_rate": 1.9232668397584494e-05, "loss": 0.4797, "step": 2461 }, { "epoch": 0.46, "learning_rate": 1.9231900873673605e-05, "loss": 0.4676, "step": 2462 }, { "epoch": 0.46, "learning_rate": 1.9231132981426966e-05, "loss": 0.4732, "step": 2463 }, { "epoch": 0.46, "learning_rate": 1.923036472087521e-05, "loss": 0.4917, "step": 2464 }, { "epoch": 0.46, "learning_rate": 1.922959609204899e-05, "loss": 0.5003, "step": 2465 }, { "epoch": 0.46, "learning_rate": 1.9228827094978975e-05, "loss": 0.4806, "step": 2466 }, { "epoch": 0.46, "learning_rate": 1.9228057729695847e-05, "loss": 0.4848, "step": 2467 }, { "epoch": 0.46, "learning_rate": 1.92272879962303e-05, "loss": 0.4984, "step": 2468 }, { "epoch": 0.46, "learning_rate": 1.9226517894613047e-05, "loss": 0.4633, "step": 2469 }, { "epoch": 0.46, "learning_rate": 1.922574742487481e-05, "loss": 0.4946, "step": 2470 }, { "epoch": 0.46, "learning_rate": 1.9224976587046332e-05, "loss": 0.5125, "step": 2471 }, { "epoch": 0.46, "learning_rate": 1.9224205381158367e-05, "loss": 0.4965, "step": 2472 }, { "epoch": 0.46, "learning_rate": 1.9223433807241687e-05, "loss": 0.4669, "step": 2473 }, { "epoch": 0.46, "learning_rate": 1.9222661865327078e-05, "loss": 0.4795, "step": 2474 }, { "epoch": 0.46, "learning_rate": 1.922188955544533e-05, "loss": 0.4774, "step": 2475 }, { "epoch": 0.46, "learning_rate": 1.9221116877627267e-05, "loss": 0.473, "step": 2476 }, { "epoch": 0.46, "learning_rate": 1.922034383190371e-05, "loss": 0.4662, "step": 2477 }, { "epoch": 0.46, "learning_rate": 1.9219570418305506e-05, "loss": 0.4746, "step": 2478 }, { "epoch": 0.46, "learning_rate": 1.921879663686351e-05, "loss": 0.469, "step": 2479 }, { "epoch": 0.46, "learning_rate": 1.9218022487608602e-05, "loss": 0.4623, "step": 2480 }, { "epoch": 0.46, "learning_rate": 1.921724797057166e-05, "loss": 0.4637, "step": 2481 }, { "epoch": 0.46, "learning_rate": 1.9216473085783588e-05, "loss": 0.5006, "step": 2482 }, { "epoch": 0.46, "learning_rate": 1.9215697833275304e-05, "loss": 0.4951, "step": 2483 }, { "epoch": 0.46, "learning_rate": 1.9214922213077743e-05, "loss": 0.4882, "step": 2484 }, { "epoch": 0.46, "learning_rate": 1.921414622522184e-05, "loss": 0.4826, "step": 2485 }, { "epoch": 0.46, "learning_rate": 1.9213369869738567e-05, "loss": 0.4813, "step": 2486 }, { "epoch": 0.46, "learning_rate": 1.9212593146658893e-05, "loss": 0.4799, "step": 2487 }, { "epoch": 0.46, "learning_rate": 1.921181605601381e-05, "loss": 0.4843, "step": 2488 }, { "epoch": 0.46, "learning_rate": 1.9211038597834323e-05, "loss": 0.4977, "step": 2489 }, { "epoch": 0.46, "learning_rate": 1.9210260772151445e-05, "loss": 0.489, "step": 2490 }, { "epoch": 0.46, "learning_rate": 1.9209482578996216e-05, "loss": 0.4805, "step": 2491 }, { "epoch": 0.46, "learning_rate": 1.9208704018399686e-05, "loss": 0.4587, "step": 2492 }, { "epoch": 0.46, "learning_rate": 1.920792509039291e-05, "loss": 0.5, "step": 2493 }, { "epoch": 0.46, "learning_rate": 1.9207145795006975e-05, "loss": 0.5015, "step": 2494 }, { "epoch": 0.46, "learning_rate": 1.920636613227297e-05, "loss": 0.4707, "step": 2495 }, { "epoch": 0.46, "learning_rate": 1.9205586102222e-05, "loss": 0.4743, "step": 2496 }, { "epoch": 0.46, "learning_rate": 1.920480570488519e-05, "loss": 0.5034, "step": 2497 }, { "epoch": 0.46, "learning_rate": 1.920402494029367e-05, "loss": 0.4945, "step": 2498 }, { "epoch": 0.46, "learning_rate": 1.92032438084786e-05, "loss": 0.4776, "step": 2499 }, { "epoch": 0.46, "learning_rate": 1.9202462309471138e-05, "loss": 0.4888, "step": 2500 }, { "epoch": 0.46, "learning_rate": 1.920168044330247e-05, "loss": 0.4768, "step": 2501 }, { "epoch": 0.46, "learning_rate": 1.920089821000379e-05, "loss": 0.4957, "step": 2502 }, { "epoch": 0.46, "learning_rate": 1.9200115609606302e-05, "loss": 0.5077, "step": 2503 }, { "epoch": 0.46, "learning_rate": 1.919933264214124e-05, "loss": 0.4706, "step": 2504 }, { "epoch": 0.46, "learning_rate": 1.9198549307639832e-05, "loss": 0.4769, "step": 2505 }, { "epoch": 0.46, "learning_rate": 1.9197765606133344e-05, "loss": 0.4494, "step": 2506 }, { "epoch": 0.46, "learning_rate": 1.9196981537653032e-05, "loss": 0.4881, "step": 2507 }, { "epoch": 0.46, "learning_rate": 1.9196197102230185e-05, "loss": 0.4671, "step": 2508 }, { "epoch": 0.46, "learning_rate": 1.91954122998961e-05, "loss": 0.4938, "step": 2509 }, { "epoch": 0.46, "learning_rate": 1.9194627130682094e-05, "loss": 0.4644, "step": 2510 }, { "epoch": 0.46, "learning_rate": 1.919384159461948e-05, "loss": 0.4947, "step": 2511 }, { "epoch": 0.46, "learning_rate": 1.919305569173962e-05, "loss": 0.4713, "step": 2512 }, { "epoch": 0.46, "learning_rate": 1.919226942207385e-05, "loss": 0.4655, "step": 2513 }, { "epoch": 0.47, "learning_rate": 1.919148278565355e-05, "loss": 0.486, "step": 2514 }, { "epoch": 0.47, "learning_rate": 1.9190695782510106e-05, "loss": 0.5162, "step": 2515 }, { "epoch": 0.47, "learning_rate": 1.9189908412674915e-05, "loss": 0.4839, "step": 2516 }, { "epoch": 0.47, "learning_rate": 1.9189120676179392e-05, "loss": 0.4844, "step": 2517 }, { "epoch": 0.47, "learning_rate": 1.918833257305497e-05, "loss": 0.483, "step": 2518 }, { "epoch": 0.47, "learning_rate": 1.9187544103333092e-05, "loss": 0.4972, "step": 2519 }, { "epoch": 0.47, "learning_rate": 1.918675526704521e-05, "loss": 0.4809, "step": 2520 }, { "epoch": 0.47, "learning_rate": 1.9185966064222806e-05, "loss": 0.4893, "step": 2521 }, { "epoch": 0.47, "learning_rate": 1.9185176494897358e-05, "loss": 0.4809, "step": 2522 }, { "epoch": 0.47, "learning_rate": 1.9184386559100377e-05, "loss": 0.4827, "step": 2523 }, { "epoch": 0.47, "learning_rate": 1.9183596256863378e-05, "loss": 0.4966, "step": 2524 }, { "epoch": 0.47, "learning_rate": 1.918280558821789e-05, "loss": 0.4837, "step": 2525 }, { "epoch": 0.47, "learning_rate": 1.9182014553195458e-05, "loss": 0.5027, "step": 2526 }, { "epoch": 0.47, "learning_rate": 1.918122315182765e-05, "loss": 0.4947, "step": 2527 }, { "epoch": 0.47, "learning_rate": 1.918043138414603e-05, "loss": 0.464, "step": 2528 }, { "epoch": 0.47, "learning_rate": 1.91796392501822e-05, "loss": 0.4763, "step": 2529 }, { "epoch": 0.47, "learning_rate": 1.9178846749967758e-05, "loss": 0.4736, "step": 2530 }, { "epoch": 0.47, "learning_rate": 1.9178053883534328e-05, "loss": 0.4672, "step": 2531 }, { "epoch": 0.47, "learning_rate": 1.9177260650913538e-05, "loss": 0.4948, "step": 2532 }, { "epoch": 0.47, "learning_rate": 1.917646705213704e-05, "loss": 0.4589, "step": 2533 }, { "epoch": 0.47, "learning_rate": 1.9175673087236495e-05, "loss": 0.5032, "step": 2534 }, { "epoch": 0.47, "learning_rate": 1.9174878756243583e-05, "loss": 0.4799, "step": 2535 }, { "epoch": 0.47, "learning_rate": 1.9174084059189998e-05, "loss": 0.509, "step": 2536 }, { "epoch": 0.47, "learning_rate": 1.917328899610744e-05, "loss": 0.4934, "step": 2537 }, { "epoch": 0.47, "learning_rate": 1.917249356702764e-05, "loss": 0.4882, "step": 2538 }, { "epoch": 0.47, "learning_rate": 1.9171697771982325e-05, "loss": 0.4975, "step": 2539 }, { "epoch": 0.47, "learning_rate": 1.9170901611003248e-05, "loss": 0.4902, "step": 2540 }, { "epoch": 0.47, "learning_rate": 1.917010508412218e-05, "loss": 0.4767, "step": 2541 }, { "epoch": 0.47, "learning_rate": 1.9169308191370897e-05, "loss": 0.4637, "step": 2542 }, { "epoch": 0.47, "learning_rate": 1.9168510932781195e-05, "loss": 0.5, "step": 2543 }, { "epoch": 0.47, "learning_rate": 1.9167713308384877e-05, "loss": 0.472, "step": 2544 }, { "epoch": 0.47, "learning_rate": 1.9166915318213773e-05, "loss": 0.4918, "step": 2545 }, { "epoch": 0.47, "learning_rate": 1.9166116962299725e-05, "loss": 0.4919, "step": 2546 }, { "epoch": 0.47, "learning_rate": 1.9165318240674576e-05, "loss": 0.4647, "step": 2547 }, { "epoch": 0.47, "learning_rate": 1.91645191533702e-05, "loss": 0.4659, "step": 2548 }, { "epoch": 0.47, "learning_rate": 1.9163719700418476e-05, "loss": 0.4807, "step": 2549 }, { "epoch": 0.47, "learning_rate": 1.91629198818513e-05, "loss": 0.4877, "step": 2550 }, { "epoch": 0.47, "learning_rate": 1.916211969770059e-05, "loss": 0.4814, "step": 2551 }, { "epoch": 0.47, "learning_rate": 1.9161319147998266e-05, "loss": 0.473, "step": 2552 }, { "epoch": 0.47, "learning_rate": 1.916051823277627e-05, "loss": 0.4719, "step": 2553 }, { "epoch": 0.47, "learning_rate": 1.9159716952066557e-05, "loss": 0.4713, "step": 2554 }, { "epoch": 0.47, "learning_rate": 1.9158915305901095e-05, "loss": 0.4687, "step": 2555 }, { "epoch": 0.47, "learning_rate": 1.915811329431187e-05, "loss": 0.5101, "step": 2556 }, { "epoch": 0.47, "learning_rate": 1.915731091733088e-05, "loss": 0.487, "step": 2557 }, { "epoch": 0.47, "learning_rate": 1.915650817499014e-05, "loss": 0.4922, "step": 2558 }, { "epoch": 0.47, "learning_rate": 1.9155705067321678e-05, "loss": 0.4876, "step": 2559 }, { "epoch": 0.47, "learning_rate": 1.915490159435753e-05, "loss": 0.486, "step": 2560 }, { "epoch": 0.47, "learning_rate": 1.9154097756129763e-05, "loss": 0.4961, "step": 2561 }, { "epoch": 0.47, "learning_rate": 1.915329355267044e-05, "loss": 0.465, "step": 2562 }, { "epoch": 0.47, "learning_rate": 1.9152488984011653e-05, "loss": 0.4813, "step": 2563 }, { "epoch": 0.47, "learning_rate": 1.9151684050185504e-05, "loss": 0.4725, "step": 2564 }, { "epoch": 0.47, "learning_rate": 1.91508787512241e-05, "loss": 0.4905, "step": 2565 }, { "epoch": 0.47, "learning_rate": 1.915007308715958e-05, "loss": 0.4844, "step": 2566 }, { "epoch": 0.47, "learning_rate": 1.9149267058024084e-05, "loss": 0.4783, "step": 2567 }, { "epoch": 0.48, "learning_rate": 1.9148460663849772e-05, "loss": 0.5078, "step": 2568 }, { "epoch": 0.48, "learning_rate": 1.9147653904668814e-05, "loss": 0.4805, "step": 2569 }, { "epoch": 0.48, "learning_rate": 1.9146846780513404e-05, "loss": 0.4868, "step": 2570 }, { "epoch": 0.48, "learning_rate": 1.9146039291415742e-05, "loss": 0.4788, "step": 2571 }, { "epoch": 0.48, "learning_rate": 1.9145231437408047e-05, "loss": 0.4919, "step": 2572 }, { "epoch": 0.48, "learning_rate": 1.914442321852255e-05, "loss": 0.4612, "step": 2573 }, { "epoch": 0.48, "learning_rate": 1.9143614634791498e-05, "loss": 0.4651, "step": 2574 }, { "epoch": 0.48, "learning_rate": 1.9142805686247147e-05, "loss": 0.5016, "step": 2575 }, { "epoch": 0.48, "learning_rate": 1.914199637292178e-05, "loss": 0.4855, "step": 2576 }, { "epoch": 0.48, "learning_rate": 1.914118669484768e-05, "loss": 0.4804, "step": 2577 }, { "epoch": 0.48, "learning_rate": 1.914037665205716e-05, "loss": 0.496, "step": 2578 }, { "epoch": 0.48, "learning_rate": 1.913956624458253e-05, "loss": 0.5015, "step": 2579 }, { "epoch": 0.48, "learning_rate": 1.913875547245613e-05, "loss": 0.4964, "step": 2580 }, { "epoch": 0.48, "learning_rate": 1.9137944335710306e-05, "loss": 0.4914, "step": 2581 }, { "epoch": 0.48, "learning_rate": 1.9137132834377422e-05, "loss": 0.4926, "step": 2582 }, { "epoch": 0.48, "learning_rate": 1.9136320968489855e-05, "loss": 0.4788, "step": 2583 }, { "epoch": 0.48, "learning_rate": 1.913550873808e-05, "loss": 0.4564, "step": 2584 }, { "epoch": 0.48, "learning_rate": 1.9134696143180255e-05, "loss": 0.497, "step": 2585 }, { "epoch": 0.48, "learning_rate": 1.913388318382305e-05, "loss": 0.4889, "step": 2586 }, { "epoch": 0.48, "learning_rate": 1.9133069860040815e-05, "loss": 0.4619, "step": 2587 }, { "epoch": 0.48, "learning_rate": 1.9132256171866003e-05, "loss": 0.4766, "step": 2588 }, { "epoch": 0.48, "learning_rate": 1.9131442119331082e-05, "loss": 0.4745, "step": 2589 }, { "epoch": 0.48, "learning_rate": 1.913062770246852e-05, "loss": 0.4729, "step": 2590 }, { "epoch": 0.48, "learning_rate": 1.912981292131082e-05, "loss": 0.4642, "step": 2591 }, { "epoch": 0.48, "learning_rate": 1.912899777589049e-05, "loss": 0.4932, "step": 2592 }, { "epoch": 0.48, "learning_rate": 1.9128182266240045e-05, "loss": 0.4685, "step": 2593 }, { "epoch": 0.48, "learning_rate": 1.912736639239203e-05, "loss": 0.4932, "step": 2594 }, { "epoch": 0.48, "learning_rate": 1.9126550154378996e-05, "loss": 0.4839, "step": 2595 }, { "epoch": 0.48, "learning_rate": 1.912573355223351e-05, "loss": 0.4805, "step": 2596 }, { "epoch": 0.48, "learning_rate": 1.9124916585988148e-05, "loss": 0.4875, "step": 2597 }, { "epoch": 0.48, "learning_rate": 1.912409925567551e-05, "loss": 0.4794, "step": 2598 }, { "epoch": 0.48, "learning_rate": 1.9123281561328207e-05, "loss": 0.4746, "step": 2599 }, { "epoch": 0.48, "learning_rate": 1.9122463502978858e-05, "loss": 0.471, "step": 2600 }, { "epoch": 0.48, "learning_rate": 1.9121645080660105e-05, "loss": 0.473, "step": 2601 }, { "epoch": 0.48, "learning_rate": 1.9120826294404603e-05, "loss": 0.479, "step": 2602 }, { "epoch": 0.48, "learning_rate": 1.9120007144245014e-05, "loss": 0.4923, "step": 2603 }, { "epoch": 0.48, "learning_rate": 1.911918763021403e-05, "loss": 0.4702, "step": 2604 }, { "epoch": 0.48, "learning_rate": 1.9118367752344343e-05, "loss": 0.4568, "step": 2605 }, { "epoch": 0.48, "learning_rate": 1.9117547510668662e-05, "loss": 0.4819, "step": 2606 }, { "epoch": 0.48, "learning_rate": 1.911672690521972e-05, "loss": 0.4954, "step": 2607 }, { "epoch": 0.48, "learning_rate": 1.911590593603025e-05, "loss": 0.4786, "step": 2608 }, { "epoch": 0.48, "learning_rate": 1.9115084603133014e-05, "loss": 0.4767, "step": 2609 }, { "epoch": 0.48, "learning_rate": 1.9114262906560776e-05, "loss": 0.4881, "step": 2610 }, { "epoch": 0.48, "learning_rate": 1.9113440846346324e-05, "loss": 0.4813, "step": 2611 }, { "epoch": 0.48, "learning_rate": 1.9112618422522457e-05, "loss": 0.5024, "step": 2612 }, { "epoch": 0.48, "learning_rate": 1.9111795635121982e-05, "loss": 0.4668, "step": 2613 }, { "epoch": 0.48, "learning_rate": 1.9110972484177735e-05, "loss": 0.4962, "step": 2614 }, { "epoch": 0.48, "learning_rate": 1.911014896972255e-05, "loss": 0.4792, "step": 2615 }, { "epoch": 0.48, "learning_rate": 1.9109325091789293e-05, "loss": 0.4834, "step": 2616 }, { "epoch": 0.48, "learning_rate": 1.910850085041083e-05, "loss": 0.4678, "step": 2617 }, { "epoch": 0.48, "learning_rate": 1.9107676245620044e-05, "loss": 0.4689, "step": 2618 }, { "epoch": 0.48, "learning_rate": 1.9106851277449837e-05, "loss": 0.476, "step": 2619 }, { "epoch": 0.48, "learning_rate": 1.910602594593313e-05, "loss": 0.4826, "step": 2620 }, { "epoch": 0.48, "learning_rate": 1.910520025110284e-05, "loss": 0.505, "step": 2621 }, { "epoch": 0.49, "learning_rate": 1.9104374192991926e-05, "loss": 0.4673, "step": 2622 }, { "epoch": 0.49, "learning_rate": 1.9103547771633333e-05, "loss": 0.4767, "step": 2623 }, { "epoch": 0.49, "learning_rate": 1.910272098706004e-05, "loss": 0.4878, "step": 2624 }, { "epoch": 0.49, "learning_rate": 1.9101893839305034e-05, "loss": 0.4664, "step": 2625 }, { "epoch": 0.49, "learning_rate": 1.9101066328401314e-05, "loss": 0.4806, "step": 2626 }, { "epoch": 0.49, "learning_rate": 1.9100238454381898e-05, "loss": 0.4702, "step": 2627 }, { "epoch": 0.49, "learning_rate": 1.9099410217279817e-05, "loss": 0.4843, "step": 2628 }, { "epoch": 0.49, "learning_rate": 1.9098581617128116e-05, "loss": 0.4888, "step": 2629 }, { "epoch": 0.49, "learning_rate": 1.909775265395985e-05, "loss": 0.4602, "step": 2630 }, { "epoch": 0.49, "learning_rate": 1.9096923327808103e-05, "loss": 0.4766, "step": 2631 }, { "epoch": 0.49, "learning_rate": 1.9096093638705952e-05, "loss": 0.4718, "step": 2632 }, { "epoch": 0.49, "learning_rate": 1.909526358668651e-05, "loss": 0.4715, "step": 2633 }, { "epoch": 0.49, "learning_rate": 1.9094433171782888e-05, "loss": 0.4913, "step": 2634 }, { "epoch": 0.49, "learning_rate": 1.9093602394028223e-05, "loss": 0.4808, "step": 2635 }, { "epoch": 0.49, "learning_rate": 1.9092771253455658e-05, "loss": 0.4669, "step": 2636 }, { "epoch": 0.49, "learning_rate": 1.9091939750098354e-05, "loss": 0.4733, "step": 2637 }, { "epoch": 0.49, "learning_rate": 1.9091107883989486e-05, "loss": 0.4886, "step": 2638 }, { "epoch": 0.49, "learning_rate": 1.909027565516225e-05, "loss": 0.4695, "step": 2639 }, { "epoch": 0.49, "learning_rate": 1.908944306364984e-05, "loss": 0.4679, "step": 2640 }, { "epoch": 0.49, "learning_rate": 1.908861010948548e-05, "loss": 0.471, "step": 2641 }, { "epoch": 0.49, "learning_rate": 1.9087776792702406e-05, "loss": 0.493, "step": 2642 }, { "epoch": 0.49, "learning_rate": 1.9086943113333865e-05, "loss": 0.4857, "step": 2643 }, { "epoch": 0.49, "learning_rate": 1.9086109071413115e-05, "loss": 0.5013, "step": 2644 }, { "epoch": 0.49, "learning_rate": 1.908527466697344e-05, "loss": 0.5035, "step": 2645 }, { "epoch": 0.49, "learning_rate": 1.9084439900048123e-05, "loss": 0.4889, "step": 2646 }, { "epoch": 0.49, "learning_rate": 1.9083604770670473e-05, "loss": 0.4977, "step": 2647 }, { "epoch": 0.49, "learning_rate": 1.9082769278873812e-05, "loss": 0.4646, "step": 2648 }, { "epoch": 0.49, "learning_rate": 1.9081933424691472e-05, "loss": 0.4806, "step": 2649 }, { "epoch": 0.49, "learning_rate": 1.9081097208156803e-05, "loss": 0.4732, "step": 2650 }, { "epoch": 0.49, "learning_rate": 1.908026062930317e-05, "loss": 0.4625, "step": 2651 }, { "epoch": 0.49, "learning_rate": 1.9079423688163948e-05, "loss": 0.4962, "step": 2652 }, { "epoch": 0.49, "learning_rate": 1.907858638477253e-05, "loss": 0.4813, "step": 2653 }, { "epoch": 0.49, "learning_rate": 1.9077748719162326e-05, "loss": 0.4786, "step": 2654 }, { "epoch": 0.49, "learning_rate": 1.9076910691366754e-05, "loss": 0.4785, "step": 2655 }, { "epoch": 0.49, "learning_rate": 1.907607230141925e-05, "loss": 0.4695, "step": 2656 }, { "epoch": 0.49, "learning_rate": 1.907523354935327e-05, "loss": 0.4666, "step": 2657 }, { "epoch": 0.49, "learning_rate": 1.907439443520227e-05, "loss": 0.4878, "step": 2658 }, { "epoch": 0.49, "learning_rate": 1.9073554958999733e-05, "loss": 0.4536, "step": 2659 }, { "epoch": 0.49, "learning_rate": 1.9072715120779152e-05, "loss": 0.5027, "step": 2660 }, { "epoch": 0.49, "learning_rate": 1.9071874920574037e-05, "loss": 0.4729, "step": 2661 }, { "epoch": 0.49, "learning_rate": 1.907103435841791e-05, "loss": 0.4598, "step": 2662 }, { "epoch": 0.49, "learning_rate": 1.9070193434344302e-05, "loss": 0.4884, "step": 2663 }, { "epoch": 0.49, "learning_rate": 1.9069352148386772e-05, "loss": 0.4853, "step": 2664 }, { "epoch": 0.49, "learning_rate": 1.9068510500578884e-05, "loss": 0.5027, "step": 2665 }, { "epoch": 0.49, "learning_rate": 1.9067668490954214e-05, "loss": 0.4644, "step": 2666 }, { "epoch": 0.49, "learning_rate": 1.906682611954636e-05, "loss": 0.49, "step": 2667 }, { "epoch": 0.49, "learning_rate": 1.906598338638893e-05, "loss": 0.4774, "step": 2668 }, { "epoch": 0.49, "learning_rate": 1.906514029151555e-05, "loss": 0.4604, "step": 2669 }, { "epoch": 0.49, "learning_rate": 1.9064296834959853e-05, "loss": 0.4893, "step": 2670 }, { "epoch": 0.49, "learning_rate": 1.90634530167555e-05, "loss": 0.5003, "step": 2671 }, { "epoch": 0.49, "learning_rate": 1.906260883693615e-05, "loss": 0.4812, "step": 2672 }, { "epoch": 0.49, "learning_rate": 1.9061764295535483e-05, "loss": 0.4679, "step": 2673 }, { "epoch": 0.49, "learning_rate": 1.9060919392587202e-05, "loss": 0.4845, "step": 2674 }, { "epoch": 0.49, "learning_rate": 1.906007412812501e-05, "loss": 0.4816, "step": 2675 }, { "epoch": 0.5, "learning_rate": 1.9059228502182635e-05, "loss": 0.4888, "step": 2676 }, { "epoch": 0.5, "learning_rate": 1.9058382514793816e-05, "loss": 0.4546, "step": 2677 }, { "epoch": 0.5, "learning_rate": 1.9057536165992308e-05, "loss": 0.4685, "step": 2678 }, { "epoch": 0.5, "learning_rate": 1.9056689455811875e-05, "loss": 0.4731, "step": 2679 }, { "epoch": 0.5, "learning_rate": 1.90558423842863e-05, "loss": 0.4732, "step": 2680 }, { "epoch": 0.5, "learning_rate": 1.905499495144938e-05, "loss": 0.4855, "step": 2681 }, { "epoch": 0.5, "learning_rate": 1.9054147157334926e-05, "loss": 0.4713, "step": 2682 }, { "epoch": 0.5, "learning_rate": 1.9053299001976765e-05, "loss": 0.4544, "step": 2683 }, { "epoch": 0.5, "learning_rate": 1.9052450485408735e-05, "loss": 0.473, "step": 2684 }, { "epoch": 0.5, "learning_rate": 1.9051601607664694e-05, "loss": 0.5036, "step": 2685 }, { "epoch": 0.5, "learning_rate": 1.9050752368778504e-05, "loss": 0.5078, "step": 2686 }, { "epoch": 0.5, "learning_rate": 1.904990276878405e-05, "loss": 0.4789, "step": 2687 }, { "epoch": 0.5, "learning_rate": 1.9049052807715235e-05, "loss": 0.4521, "step": 2688 }, { "epoch": 0.5, "learning_rate": 1.9048202485605968e-05, "loss": 0.4762, "step": 2689 }, { "epoch": 0.5, "learning_rate": 1.9047351802490167e-05, "loss": 0.4601, "step": 2690 }, { "epoch": 0.5, "learning_rate": 1.9046500758401786e-05, "loss": 0.5123, "step": 2691 }, { "epoch": 0.5, "learning_rate": 1.904564935337477e-05, "loss": 0.484, "step": 2692 }, { "epoch": 0.5, "learning_rate": 1.9044797587443095e-05, "loss": 0.4661, "step": 2693 }, { "epoch": 0.5, "learning_rate": 1.9043945460640744e-05, "loss": 0.4919, "step": 2694 }, { "epoch": 0.5, "learning_rate": 1.9043092973001707e-05, "loss": 0.4677, "step": 2695 }, { "epoch": 0.5, "learning_rate": 1.9042240124560008e-05, "loss": 0.4567, "step": 2696 }, { "epoch": 0.5, "learning_rate": 1.904138691534967e-05, "loss": 0.4453, "step": 2697 }, { "epoch": 0.5, "learning_rate": 1.9040533345404734e-05, "loss": 0.4679, "step": 2698 }, { "epoch": 0.5, "learning_rate": 1.903967941475925e-05, "loss": 0.477, "step": 2699 }, { "epoch": 0.5, "learning_rate": 1.90388251234473e-05, "loss": 0.4967, "step": 2700 }, { "epoch": 0.5, "learning_rate": 1.903797047150296e-05, "loss": 0.475, "step": 2701 }, { "epoch": 0.5, "learning_rate": 1.9037115458960332e-05, "loss": 0.4806, "step": 2702 }, { "epoch": 0.5, "learning_rate": 1.9036260085853528e-05, "loss": 0.4859, "step": 2703 }, { "epoch": 0.5, "learning_rate": 1.9035404352216677e-05, "loss": 0.5036, "step": 2704 }, { "epoch": 0.5, "learning_rate": 1.9034548258083922e-05, "loss": 0.4889, "step": 2705 }, { "epoch": 0.5, "learning_rate": 1.903369180348942e-05, "loss": 0.4797, "step": 2706 }, { "epoch": 0.5, "learning_rate": 1.9032834988467336e-05, "loss": 0.5014, "step": 2707 }, { "epoch": 0.5, "learning_rate": 1.9031977813051866e-05, "loss": 0.4571, "step": 2708 }, { "epoch": 0.5, "learning_rate": 1.9031120277277197e-05, "loss": 0.4638, "step": 2709 }, { "epoch": 0.5, "learning_rate": 1.9030262381177555e-05, "loss": 0.461, "step": 2710 }, { "epoch": 0.5, "learning_rate": 1.902940412478716e-05, "loss": 0.4877, "step": 2711 }, { "epoch": 0.5, "learning_rate": 1.9028545508140258e-05, "loss": 0.4769, "step": 2712 }, { "epoch": 0.5, "learning_rate": 1.9027686531271105e-05, "loss": 0.4933, "step": 2713 }, { "epoch": 0.5, "learning_rate": 1.9026827194213978e-05, "loss": 0.4727, "step": 2714 }, { "epoch": 0.5, "learning_rate": 1.902596749700315e-05, "loss": 0.4693, "step": 2715 }, { "epoch": 0.5, "learning_rate": 1.902510743967294e-05, "loss": 0.4935, "step": 2716 }, { "epoch": 0.5, "learning_rate": 1.9024247022257646e-05, "loss": 0.484, "step": 2717 }, { "epoch": 0.5, "learning_rate": 1.9023386244791607e-05, "loss": 0.4681, "step": 2718 }, { "epoch": 0.5, "learning_rate": 1.9022525107309165e-05, "loss": 0.4629, "step": 2719 }, { "epoch": 0.5, "learning_rate": 1.902166360984467e-05, "loss": 0.4689, "step": 2720 }, { "epoch": 0.5, "learning_rate": 1.9020801752432505e-05, "loss": 0.4836, "step": 2721 }, { "epoch": 0.5, "learning_rate": 1.901993953510705e-05, "loss": 0.485, "step": 2722 }, { "epoch": 0.5, "learning_rate": 1.901907695790271e-05, "loss": 0.4665, "step": 2723 }, { "epoch": 0.5, "learning_rate": 1.9018214020853896e-05, "loss": 0.4941, "step": 2724 }, { "epoch": 0.5, "learning_rate": 1.9017350723995037e-05, "loss": 0.4838, "step": 2725 }, { "epoch": 0.5, "learning_rate": 1.9016487067360584e-05, "loss": 0.4704, "step": 2726 }, { "epoch": 0.5, "learning_rate": 1.9015623050984988e-05, "loss": 0.4801, "step": 2727 }, { "epoch": 0.5, "learning_rate": 1.901475867490272e-05, "loss": 0.4746, "step": 2728 }, { "epoch": 0.5, "learning_rate": 1.9013893939148277e-05, "loss": 0.4789, "step": 2729 }, { "epoch": 0.51, "learning_rate": 1.9013028843756155e-05, "loss": 0.4949, "step": 2730 }, { "epoch": 0.51, "learning_rate": 1.9012163388760868e-05, "loss": 0.4901, "step": 2731 }, { "epoch": 0.51, "learning_rate": 1.9011297574196944e-05, "loss": 0.4778, "step": 2732 }, { "epoch": 0.51, "learning_rate": 1.9010431400098935e-05, "loss": 0.4825, "step": 2733 }, { "epoch": 0.51, "learning_rate": 1.9009564866501393e-05, "loss": 0.4958, "step": 2734 }, { "epoch": 0.51, "learning_rate": 1.9008697973438894e-05, "loss": 0.4769, "step": 2735 }, { "epoch": 0.51, "learning_rate": 1.9007830720946025e-05, "loss": 0.4865, "step": 2736 }, { "epoch": 0.51, "learning_rate": 1.900696310905739e-05, "loss": 0.4985, "step": 2737 }, { "epoch": 0.51, "learning_rate": 1.9006095137807602e-05, "loss": 0.4918, "step": 2738 }, { "epoch": 0.51, "learning_rate": 1.9005226807231293e-05, "loss": 0.469, "step": 2739 }, { "epoch": 0.51, "learning_rate": 1.9004358117363102e-05, "loss": 0.4635, "step": 2740 }, { "epoch": 0.51, "learning_rate": 1.9003489068237698e-05, "loss": 0.4754, "step": 2741 }, { "epoch": 0.51, "learning_rate": 1.9002619659889747e-05, "loss": 0.4902, "step": 2742 }, { "epoch": 0.51, "learning_rate": 1.9001749892353945e-05, "loss": 0.4741, "step": 2743 }, { "epoch": 0.51, "learning_rate": 1.9000879765664983e-05, "loss": 0.4745, "step": 2744 }, { "epoch": 0.51, "learning_rate": 1.9000009279857584e-05, "loss": 0.4853, "step": 2745 }, { "epoch": 0.51, "learning_rate": 1.899913843496648e-05, "loss": 0.4971, "step": 2746 }, { "epoch": 0.51, "learning_rate": 1.899826723102641e-05, "loss": 0.4465, "step": 2747 }, { "epoch": 0.51, "learning_rate": 1.899739566807214e-05, "loss": 0.4698, "step": 2748 }, { "epoch": 0.51, "learning_rate": 1.899652374613844e-05, "loss": 0.4791, "step": 2749 }, { "epoch": 0.51, "learning_rate": 1.89956514652601e-05, "loss": 0.465, "step": 2750 }, { "epoch": 0.51, "learning_rate": 1.8994778825471923e-05, "loss": 0.4743, "step": 2751 }, { "epoch": 0.51, "learning_rate": 1.8993905826808723e-05, "loss": 0.4895, "step": 2752 }, { "epoch": 0.51, "learning_rate": 1.8993032469305333e-05, "loss": 0.4655, "step": 2753 }, { "epoch": 0.51, "learning_rate": 1.8992158752996596e-05, "loss": 0.4683, "step": 2754 }, { "epoch": 0.51, "learning_rate": 1.8991284677917373e-05, "loss": 0.4591, "step": 2755 }, { "epoch": 0.51, "learning_rate": 1.899041024410254e-05, "loss": 0.4704, "step": 2756 }, { "epoch": 0.51, "learning_rate": 1.8989535451586984e-05, "loss": 0.4688, "step": 2757 }, { "epoch": 0.51, "learning_rate": 1.8988660300405602e-05, "loss": 0.4733, "step": 2758 }, { "epoch": 0.51, "learning_rate": 1.8987784790593324e-05, "loss": 0.4632, "step": 2759 }, { "epoch": 0.51, "learning_rate": 1.898690892218507e-05, "loss": 0.4708, "step": 2760 }, { "epoch": 0.51, "learning_rate": 1.8986032695215785e-05, "loss": 0.5048, "step": 2761 }, { "epoch": 0.51, "learning_rate": 1.898515610972044e-05, "loss": 0.4735, "step": 2762 }, { "epoch": 0.51, "learning_rate": 1.8984279165733993e-05, "loss": 0.468, "step": 2763 }, { "epoch": 0.51, "learning_rate": 1.8983401863291448e-05, "loss": 0.4811, "step": 2764 }, { "epoch": 0.51, "learning_rate": 1.89825242024278e-05, "loss": 0.4846, "step": 2765 }, { "epoch": 0.51, "learning_rate": 1.8981646183178065e-05, "loss": 0.4957, "step": 2766 }, { "epoch": 0.51, "learning_rate": 1.8980767805577277e-05, "loss": 0.4617, "step": 2767 }, { "epoch": 0.51, "learning_rate": 1.8979889069660482e-05, "loss": 0.4816, "step": 2768 }, { "epoch": 0.51, "learning_rate": 1.8979009975462736e-05, "loss": 0.4792, "step": 2769 }, { "epoch": 0.51, "learning_rate": 1.897813052301912e-05, "loss": 0.4776, "step": 2770 }, { "epoch": 0.51, "learning_rate": 1.8977250712364716e-05, "loss": 0.4976, "step": 2771 }, { "epoch": 0.51, "learning_rate": 1.8976370543534633e-05, "loss": 0.4738, "step": 2772 }, { "epoch": 0.51, "learning_rate": 1.897549001656398e-05, "loss": 0.4851, "step": 2773 }, { "epoch": 0.51, "learning_rate": 1.8974609131487897e-05, "loss": 0.4833, "step": 2774 }, { "epoch": 0.51, "learning_rate": 1.8973727888341522e-05, "loss": 0.4567, "step": 2775 }, { "epoch": 0.51, "learning_rate": 1.897284628716002e-05, "loss": 0.4882, "step": 2776 }, { "epoch": 0.51, "learning_rate": 1.8971964327978566e-05, "loss": 0.4801, "step": 2777 }, { "epoch": 0.51, "learning_rate": 1.8971082010832345e-05, "loss": 0.4723, "step": 2778 }, { "epoch": 0.51, "learning_rate": 1.8970199335756563e-05, "loss": 0.4709, "step": 2779 }, { "epoch": 0.51, "learning_rate": 1.896931630278643e-05, "loss": 0.4825, "step": 2780 }, { "epoch": 0.51, "learning_rate": 1.896843291195719e-05, "loss": 0.4789, "step": 2781 }, { "epoch": 0.51, "learning_rate": 1.8967549163304078e-05, "loss": 0.4763, "step": 2782 }, { "epoch": 0.51, "learning_rate": 1.8966665056862355e-05, "loss": 0.5028, "step": 2783 }, { "epoch": 0.52, "learning_rate": 1.89657805926673e-05, "loss": 0.4878, "step": 2784 }, { "epoch": 0.52, "learning_rate": 1.89648957707542e-05, "loss": 0.4691, "step": 2785 }, { "epoch": 0.52, "learning_rate": 1.8964010591158355e-05, "loss": 0.4659, "step": 2786 }, { "epoch": 0.52, "learning_rate": 1.8963125053915083e-05, "loss": 0.4862, "step": 2787 }, { "epoch": 0.52, "learning_rate": 1.896223915905972e-05, "loss": 0.4693, "step": 2788 }, { "epoch": 0.52, "learning_rate": 1.8961352906627603e-05, "loss": 0.4911, "step": 2789 }, { "epoch": 0.52, "learning_rate": 1.89604662966541e-05, "loss": 0.4572, "step": 2790 }, { "epoch": 0.52, "learning_rate": 1.895957932917458e-05, "loss": 0.4779, "step": 2791 }, { "epoch": 0.52, "learning_rate": 1.8958692004224435e-05, "loss": 0.4708, "step": 2792 }, { "epoch": 0.52, "learning_rate": 1.8957804321839063e-05, "loss": 0.4607, "step": 2793 }, { "epoch": 0.52, "learning_rate": 1.8956916282053886e-05, "loss": 0.4733, "step": 2794 }, { "epoch": 0.52, "learning_rate": 1.895602788490433e-05, "loss": 0.4884, "step": 2795 }, { "epoch": 0.52, "learning_rate": 1.8955139130425843e-05, "loss": 0.4843, "step": 2796 }, { "epoch": 0.52, "learning_rate": 1.8954250018653887e-05, "loss": 0.4918, "step": 2797 }, { "epoch": 0.52, "learning_rate": 1.8953360549623933e-05, "loss": 0.4697, "step": 2798 }, { "epoch": 0.52, "learning_rate": 1.8952470723371466e-05, "loss": 0.4625, "step": 2799 }, { "epoch": 0.52, "learning_rate": 1.8951580539931996e-05, "loss": 0.4701, "step": 2800 }, { "epoch": 0.52, "learning_rate": 1.895068999934104e-05, "loss": 0.4702, "step": 2801 }, { "epoch": 0.52, "learning_rate": 1.8949799101634118e-05, "loss": 0.4727, "step": 2802 }, { "epoch": 0.52, "learning_rate": 1.8948907846846786e-05, "loss": 0.4651, "step": 2803 }, { "epoch": 0.52, "learning_rate": 1.8948016235014596e-05, "loss": 0.482, "step": 2804 }, { "epoch": 0.52, "learning_rate": 1.8947124266173123e-05, "loss": 0.4719, "step": 2805 }, { "epoch": 0.52, "learning_rate": 1.8946231940357963e-05, "loss": 0.4678, "step": 2806 }, { "epoch": 0.52, "learning_rate": 1.8945339257604708e-05, "loss": 0.4846, "step": 2807 }, { "epoch": 0.52, "learning_rate": 1.894444621794898e-05, "loss": 0.5031, "step": 2808 }, { "epoch": 0.52, "learning_rate": 1.894355282142641e-05, "loss": 0.4779, "step": 2809 }, { "epoch": 0.52, "learning_rate": 1.8942659068072638e-05, "loss": 0.4975, "step": 2810 }, { "epoch": 0.52, "learning_rate": 1.8941764957923326e-05, "loss": 0.4676, "step": 2811 }, { "epoch": 0.52, "learning_rate": 1.894087049101415e-05, "loss": 0.4685, "step": 2812 }, { "epoch": 0.52, "learning_rate": 1.8939975667380793e-05, "loss": 0.477, "step": 2813 }, { "epoch": 0.52, "learning_rate": 1.893908048705896e-05, "loss": 0.4906, "step": 2814 }, { "epoch": 0.52, "learning_rate": 1.8938184950084365e-05, "loss": 0.4773, "step": 2815 }, { "epoch": 0.52, "learning_rate": 1.893728905649274e-05, "loss": 0.4655, "step": 2816 }, { "epoch": 0.52, "learning_rate": 1.8936392806319826e-05, "loss": 0.4835, "step": 2817 }, { "epoch": 0.52, "learning_rate": 1.8935496199601387e-05, "loss": 0.5006, "step": 2818 }, { "epoch": 0.52, "learning_rate": 1.893459923637319e-05, "loss": 0.4868, "step": 2819 }, { "epoch": 0.52, "learning_rate": 1.8933701916671033e-05, "loss": 0.483, "step": 2820 }, { "epoch": 0.52, "learning_rate": 1.8932804240530703e-05, "loss": 0.4837, "step": 2821 }, { "epoch": 0.52, "learning_rate": 1.8931906207988026e-05, "loss": 0.4866, "step": 2822 }, { "epoch": 0.52, "learning_rate": 1.8931007819078825e-05, "loss": 0.468, "step": 2823 }, { "epoch": 0.52, "learning_rate": 1.8930109073838947e-05, "loss": 0.4998, "step": 2824 }, { "epoch": 0.52, "learning_rate": 1.892920997230425e-05, "loss": 0.473, "step": 2825 }, { "epoch": 0.52, "learning_rate": 1.892831051451061e-05, "loss": 0.4838, "step": 2826 }, { "epoch": 0.52, "learning_rate": 1.8927410700493915e-05, "loss": 0.482, "step": 2827 }, { "epoch": 0.52, "learning_rate": 1.8926510530290055e-05, "loss": 0.4649, "step": 2828 }, { "epoch": 0.52, "learning_rate": 1.8925610003934954e-05, "loss": 0.4722, "step": 2829 }, { "epoch": 0.52, "learning_rate": 1.8924709121464538e-05, "loss": 0.4666, "step": 2830 }, { "epoch": 0.52, "learning_rate": 1.8923807882914756e-05, "loss": 0.4823, "step": 2831 }, { "epoch": 0.52, "learning_rate": 1.8922906288321556e-05, "loss": 0.4591, "step": 2832 }, { "epoch": 0.52, "learning_rate": 1.8922004337720917e-05, "loss": 0.4862, "step": 2833 }, { "epoch": 0.52, "learning_rate": 1.8921102031148826e-05, "loss": 0.4949, "step": 2834 }, { "epoch": 0.52, "learning_rate": 1.8920199368641278e-05, "loss": 0.4943, "step": 2835 }, { "epoch": 0.52, "learning_rate": 1.8919296350234293e-05, "loss": 0.5033, "step": 2836 }, { "epoch": 0.52, "learning_rate": 1.8918392975963894e-05, "loss": 0.494, "step": 2837 }, { "epoch": 0.53, "learning_rate": 1.891748924586613e-05, "loss": 0.4645, "step": 2838 }, { "epoch": 0.53, "learning_rate": 1.8916585159977053e-05, "loss": 0.4797, "step": 2839 }, { "epoch": 0.53, "learning_rate": 1.891568071833274e-05, "loss": 0.4702, "step": 2840 }, { "epoch": 0.53, "learning_rate": 1.8914775920969273e-05, "loss": 0.4936, "step": 2841 }, { "epoch": 0.53, "learning_rate": 1.891387076792275e-05, "loss": 0.4556, "step": 2842 }, { "epoch": 0.53, "learning_rate": 1.8912965259229285e-05, "loss": 0.4824, "step": 2843 }, { "epoch": 0.53, "learning_rate": 1.891205939492501e-05, "loss": 0.4995, "step": 2844 }, { "epoch": 0.53, "learning_rate": 1.8911153175046068e-05, "loss": 0.4636, "step": 2845 }, { "epoch": 0.53, "learning_rate": 1.891024659962861e-05, "loss": 0.4893, "step": 2846 }, { "epoch": 0.53, "learning_rate": 1.890933966870881e-05, "loss": 0.4676, "step": 2847 }, { "epoch": 0.53, "learning_rate": 1.8908432382322853e-05, "loss": 0.4784, "step": 2848 }, { "epoch": 0.53, "learning_rate": 1.8907524740506937e-05, "loss": 0.4619, "step": 2849 }, { "epoch": 0.53, "learning_rate": 1.8906616743297276e-05, "loss": 0.4961, "step": 2850 }, { "epoch": 0.53, "learning_rate": 1.8905708390730098e-05, "loss": 0.4777, "step": 2851 }, { "epoch": 0.53, "learning_rate": 1.890479968284164e-05, "loss": 0.4849, "step": 2852 }, { "epoch": 0.53, "learning_rate": 1.8903890619668165e-05, "loss": 0.4759, "step": 2853 }, { "epoch": 0.53, "learning_rate": 1.890298120124594e-05, "loss": 0.4735, "step": 2854 }, { "epoch": 0.53, "learning_rate": 1.8902071427611245e-05, "loss": 0.4771, "step": 2855 }, { "epoch": 0.53, "learning_rate": 1.8901161298800387e-05, "loss": 0.4738, "step": 2856 }, { "epoch": 0.53, "learning_rate": 1.890025081484967e-05, "loss": 0.47, "step": 2857 }, { "epoch": 0.53, "learning_rate": 1.8899339975795424e-05, "loss": 0.472, "step": 2858 }, { "epoch": 0.53, "learning_rate": 1.889842878167399e-05, "loss": 0.4767, "step": 2859 }, { "epoch": 0.53, "learning_rate": 1.889751723252172e-05, "loss": 0.4648, "step": 2860 }, { "epoch": 0.53, "learning_rate": 1.8896605328374987e-05, "loss": 0.4898, "step": 2861 }, { "epoch": 0.53, "learning_rate": 1.8895693069270175e-05, "loss": 0.4559, "step": 2862 }, { "epoch": 0.53, "learning_rate": 1.889478045524368e-05, "loss": 0.4652, "step": 2863 }, { "epoch": 0.53, "learning_rate": 1.889386748633191e-05, "loss": 0.4859, "step": 2864 }, { "epoch": 0.53, "learning_rate": 1.88929541625713e-05, "loss": 0.4729, "step": 2865 }, { "epoch": 0.53, "learning_rate": 1.8892040483998276e-05, "loss": 0.4812, "step": 2866 }, { "epoch": 0.53, "learning_rate": 1.8891126450649304e-05, "loss": 0.4646, "step": 2867 }, { "epoch": 0.53, "learning_rate": 1.8890212062560848e-05, "loss": 0.4636, "step": 2868 }, { "epoch": 0.53, "learning_rate": 1.888929731976939e-05, "loss": 0.4775, "step": 2869 }, { "epoch": 0.53, "learning_rate": 1.8888382222311425e-05, "loss": 0.4953, "step": 2870 }, { "epoch": 0.53, "learning_rate": 1.8887466770223466e-05, "loss": 0.4884, "step": 2871 }, { "epoch": 0.53, "learning_rate": 1.888655096354204e-05, "loss": 0.4504, "step": 2872 }, { "epoch": 0.53, "learning_rate": 1.8885634802303682e-05, "loss": 0.4725, "step": 2873 }, { "epoch": 0.53, "learning_rate": 1.888471828654495e-05, "loss": 0.4645, "step": 2874 }, { "epoch": 0.53, "learning_rate": 1.8883801416302402e-05, "loss": 0.4775, "step": 2875 }, { "epoch": 0.53, "learning_rate": 1.888288419161263e-05, "loss": 0.4961, "step": 2876 }, { "epoch": 0.53, "learning_rate": 1.8881966612512225e-05, "loss": 0.4634, "step": 2877 }, { "epoch": 0.53, "learning_rate": 1.8881048679037795e-05, "loss": 0.4729, "step": 2878 }, { "epoch": 0.53, "learning_rate": 1.8880130391225963e-05, "loss": 0.4541, "step": 2879 }, { "epoch": 0.53, "learning_rate": 1.8879211749113374e-05, "loss": 0.4625, "step": 2880 }, { "epoch": 0.53, "learning_rate": 1.8878292752736676e-05, "loss": 0.4718, "step": 2881 }, { "epoch": 0.53, "learning_rate": 1.887737340213253e-05, "loss": 0.4638, "step": 2882 }, { "epoch": 0.53, "learning_rate": 1.8876453697337624e-05, "loss": 0.469, "step": 2883 }, { "epoch": 0.53, "learning_rate": 1.887553363838865e-05, "loss": 0.4867, "step": 2884 }, { "epoch": 0.53, "learning_rate": 1.8874613225322317e-05, "loss": 0.4902, "step": 2885 }, { "epoch": 0.53, "learning_rate": 1.8873692458175347e-05, "loss": 0.4759, "step": 2886 }, { "epoch": 0.53, "learning_rate": 1.8872771336984476e-05, "loss": 0.4677, "step": 2887 }, { "epoch": 0.53, "learning_rate": 1.8871849861786457e-05, "loss": 0.4689, "step": 2888 }, { "epoch": 0.53, "learning_rate": 1.8870928032618055e-05, "loss": 0.4637, "step": 2889 }, { "epoch": 0.53, "learning_rate": 1.8870005849516046e-05, "loss": 0.4975, "step": 2890 }, { "epoch": 0.53, "learning_rate": 1.886908331251723e-05, "loss": 0.4678, "step": 2891 }, { "epoch": 0.54, "learning_rate": 1.886816042165841e-05, "loss": 0.4484, "step": 2892 }, { "epoch": 0.54, "learning_rate": 1.8867237176976407e-05, "loss": 0.4685, "step": 2893 }, { "epoch": 0.54, "learning_rate": 1.8866313578508055e-05, "loss": 0.4516, "step": 2894 }, { "epoch": 0.54, "learning_rate": 1.886538962629021e-05, "loss": 0.4763, "step": 2895 }, { "epoch": 0.54, "learning_rate": 1.886446532035973e-05, "loss": 0.4784, "step": 2896 }, { "epoch": 0.54, "learning_rate": 1.8863540660753498e-05, "loss": 0.4923, "step": 2897 }, { "epoch": 0.54, "learning_rate": 1.8862615647508403e-05, "loss": 0.4802, "step": 2898 }, { "epoch": 0.54, "learning_rate": 1.8861690280661354e-05, "loss": 0.4565, "step": 2899 }, { "epoch": 0.54, "learning_rate": 1.886076456024927e-05, "loss": 0.4645, "step": 2900 }, { "epoch": 0.54, "learning_rate": 1.8859838486309082e-05, "loss": 0.4774, "step": 2901 }, { "epoch": 0.54, "learning_rate": 1.8858912058877744e-05, "loss": 0.469, "step": 2902 }, { "epoch": 0.54, "learning_rate": 1.8857985277992216e-05, "loss": 0.4759, "step": 2903 }, { "epoch": 0.54, "learning_rate": 1.8857058143689478e-05, "loss": 0.4598, "step": 2904 }, { "epoch": 0.54, "learning_rate": 1.885613065600652e-05, "loss": 0.4741, "step": 2905 }, { "epoch": 0.54, "learning_rate": 1.885520281498034e-05, "loss": 0.4786, "step": 2906 }, { "epoch": 0.54, "learning_rate": 1.8854274620647965e-05, "loss": 0.4791, "step": 2907 }, { "epoch": 0.54, "learning_rate": 1.8853346073046424e-05, "loss": 0.4663, "step": 2908 }, { "epoch": 0.54, "learning_rate": 1.8852417172212768e-05, "loss": 0.4748, "step": 2909 }, { "epoch": 0.54, "learning_rate": 1.8851487918184055e-05, "loss": 0.466, "step": 2910 }, { "epoch": 0.54, "learning_rate": 1.8850558310997366e-05, "loss": 0.4777, "step": 2911 }, { "epoch": 0.54, "learning_rate": 1.8849628350689783e-05, "loss": 0.4797, "step": 2912 }, { "epoch": 0.54, "learning_rate": 1.8848698037298417e-05, "loss": 0.4856, "step": 2913 }, { "epoch": 0.54, "learning_rate": 1.884776737086038e-05, "loss": 0.4708, "step": 2914 }, { "epoch": 0.54, "learning_rate": 1.8846836351412807e-05, "loss": 0.4938, "step": 2915 }, { "epoch": 0.54, "learning_rate": 1.8845904978992843e-05, "loss": 0.4788, "step": 2916 }, { "epoch": 0.54, "learning_rate": 1.8844973253637646e-05, "loss": 0.4731, "step": 2917 }, { "epoch": 0.54, "learning_rate": 1.8844041175384396e-05, "loss": 0.447, "step": 2918 }, { "epoch": 0.54, "learning_rate": 1.8843108744270274e-05, "loss": 0.47, "step": 2919 }, { "epoch": 0.54, "learning_rate": 1.8842175960332487e-05, "loss": 0.4913, "step": 2920 }, { "epoch": 0.54, "learning_rate": 1.884124282360825e-05, "loss": 0.4817, "step": 2921 }, { "epoch": 0.54, "learning_rate": 1.8840309334134793e-05, "loss": 0.4745, "step": 2922 }, { "epoch": 0.54, "learning_rate": 1.883937549194936e-05, "loss": 0.4799, "step": 2923 }, { "epoch": 0.54, "learning_rate": 1.8838441297089215e-05, "loss": 0.4892, "step": 2924 }, { "epoch": 0.54, "learning_rate": 1.8837506749591622e-05, "loss": 0.475, "step": 2925 }, { "epoch": 0.54, "learning_rate": 1.8836571849493872e-05, "loss": 0.4751, "step": 2926 }, { "epoch": 0.54, "learning_rate": 1.883563659683327e-05, "loss": 0.4779, "step": 2927 }, { "epoch": 0.54, "learning_rate": 1.883470099164712e-05, "loss": 0.4888, "step": 2928 }, { "epoch": 0.54, "learning_rate": 1.883376503397276e-05, "loss": 0.4808, "step": 2929 }, { "epoch": 0.54, "learning_rate": 1.8832828723847533e-05, "loss": 0.4807, "step": 2930 }, { "epoch": 0.54, "learning_rate": 1.883189206130879e-05, "loss": 0.4834, "step": 2931 }, { "epoch": 0.54, "learning_rate": 1.883095504639391e-05, "loss": 0.4677, "step": 2932 }, { "epoch": 0.54, "learning_rate": 1.8830017679140267e-05, "loss": 0.4755, "step": 2933 }, { "epoch": 0.54, "learning_rate": 1.8829079959585274e-05, "loss": 0.467, "step": 2934 }, { "epoch": 0.54, "learning_rate": 1.8828141887766334e-05, "loss": 0.4858, "step": 2935 }, { "epoch": 0.54, "learning_rate": 1.8827203463720875e-05, "loss": 0.4573, "step": 2936 }, { "epoch": 0.54, "learning_rate": 1.8826264687486344e-05, "loss": 0.4565, "step": 2937 }, { "epoch": 0.54, "learning_rate": 1.8825325559100193e-05, "loss": 0.5058, "step": 2938 }, { "epoch": 0.54, "learning_rate": 1.882438607859989e-05, "loss": 0.4747, "step": 2939 }, { "epoch": 0.54, "learning_rate": 1.8823446246022924e-05, "loss": 0.4839, "step": 2940 }, { "epoch": 0.54, "learning_rate": 1.8822506061406786e-05, "loss": 0.4747, "step": 2941 }, { "epoch": 0.54, "learning_rate": 1.882156552478899e-05, "loss": 0.4816, "step": 2942 }, { "epoch": 0.54, "learning_rate": 1.8820624636207066e-05, "loss": 0.452, "step": 2943 }, { "epoch": 0.54, "learning_rate": 1.881968339569855e-05, "loss": 0.465, "step": 2944 }, { "epoch": 0.54, "learning_rate": 1.8818741803300994e-05, "loss": 0.4765, "step": 2945 }, { "epoch": 0.55, "learning_rate": 1.8817799859051967e-05, "loss": 0.4828, "step": 2946 }, { "epoch": 0.55, "learning_rate": 1.881685756298905e-05, "loss": 0.4585, "step": 2947 }, { "epoch": 0.55, "learning_rate": 1.881591491514984e-05, "loss": 0.4936, "step": 2948 }, { "epoch": 0.55, "learning_rate": 1.881497191557195e-05, "loss": 0.4885, "step": 2949 }, { "epoch": 0.55, "learning_rate": 1.8814028564293e-05, "loss": 0.4947, "step": 2950 }, { "epoch": 0.55, "learning_rate": 1.8813084861350627e-05, "loss": 0.4664, "step": 2951 }, { "epoch": 0.55, "learning_rate": 1.881214080678249e-05, "loss": 0.4793, "step": 2952 }, { "epoch": 0.55, "learning_rate": 1.8811196400626245e-05, "loss": 0.479, "step": 2953 }, { "epoch": 0.55, "learning_rate": 1.8810251642919577e-05, "loss": 0.4703, "step": 2954 }, { "epoch": 0.55, "learning_rate": 1.8809306533700186e-05, "loss": 0.4686, "step": 2955 }, { "epoch": 0.55, "learning_rate": 1.880836107300577e-05, "loss": 0.4574, "step": 2956 }, { "epoch": 0.55, "learning_rate": 1.8807415260874052e-05, "loss": 0.4716, "step": 2957 }, { "epoch": 0.55, "learning_rate": 1.880646909734278e-05, "loss": 0.4711, "step": 2958 }, { "epoch": 0.55, "learning_rate": 1.880552258244969e-05, "loss": 0.491, "step": 2959 }, { "epoch": 0.55, "learning_rate": 1.8804575716232555e-05, "loss": 0.5007, "step": 2960 }, { "epoch": 0.55, "learning_rate": 1.8803628498729144e-05, "loss": 0.4919, "step": 2961 }, { "epoch": 0.55, "learning_rate": 1.880268092997726e-05, "loss": 0.4848, "step": 2962 }, { "epoch": 0.55, "learning_rate": 1.8801733010014708e-05, "loss": 0.4802, "step": 2963 }, { "epoch": 0.55, "learning_rate": 1.88007847388793e-05, "loss": 0.4639, "step": 2964 }, { "epoch": 0.55, "learning_rate": 1.8799836116608875e-05, "loss": 0.4676, "step": 2965 }, { "epoch": 0.55, "learning_rate": 1.8798887143241283e-05, "loss": 0.4711, "step": 2966 }, { "epoch": 0.55, "learning_rate": 1.8797937818814383e-05, "loss": 0.4528, "step": 2967 }, { "epoch": 0.55, "learning_rate": 1.8796988143366056e-05, "loss": 0.4833, "step": 2968 }, { "epoch": 0.55, "learning_rate": 1.8796038116934187e-05, "loss": 0.4546, "step": 2969 }, { "epoch": 0.55, "learning_rate": 1.8795087739556684e-05, "loss": 0.4711, "step": 2970 }, { "epoch": 0.55, "learning_rate": 1.8794137011271462e-05, "loss": 0.4715, "step": 2971 }, { "epoch": 0.55, "learning_rate": 1.879318593211646e-05, "loss": 0.4702, "step": 2972 }, { "epoch": 0.55, "learning_rate": 1.8792234502129614e-05, "loss": 0.4851, "step": 2973 }, { "epoch": 0.55, "learning_rate": 1.8791282721348892e-05, "loss": 0.4609, "step": 2974 }, { "epoch": 0.55, "learning_rate": 1.8790330589812264e-05, "loss": 0.4893, "step": 2975 }, { "epoch": 0.55, "learning_rate": 1.878937810755772e-05, "loss": 0.4685, "step": 2976 }, { "epoch": 0.55, "learning_rate": 1.8788425274623267e-05, "loss": 0.4785, "step": 2977 }, { "epoch": 0.55, "learning_rate": 1.8787472091046914e-05, "loss": 0.4859, "step": 2978 }, { "epoch": 0.55, "learning_rate": 1.8786518556866696e-05, "loss": 0.4542, "step": 2979 }, { "epoch": 0.55, "learning_rate": 1.8785564672120654e-05, "loss": 0.4513, "step": 2980 }, { "epoch": 0.55, "learning_rate": 1.8784610436846845e-05, "loss": 0.493, "step": 2981 }, { "epoch": 0.55, "learning_rate": 1.878365585108335e-05, "loss": 0.4873, "step": 2982 }, { "epoch": 0.55, "learning_rate": 1.8782700914868244e-05, "loss": 0.4837, "step": 2983 }, { "epoch": 0.55, "learning_rate": 1.878174562823963e-05, "loss": 0.4742, "step": 2984 }, { "epoch": 0.55, "learning_rate": 1.878078999123563e-05, "loss": 0.513, "step": 2985 }, { "epoch": 0.55, "learning_rate": 1.8779834003894365e-05, "loss": 0.4814, "step": 2986 }, { "epoch": 0.55, "learning_rate": 1.877887766625398e-05, "loss": 0.4599, "step": 2987 }, { "epoch": 0.55, "learning_rate": 1.8777920978352626e-05, "loss": 0.4956, "step": 2988 }, { "epoch": 0.55, "learning_rate": 1.877696394022848e-05, "loss": 0.4878, "step": 2989 }, { "epoch": 0.55, "learning_rate": 1.877600655191972e-05, "loss": 0.468, "step": 2990 }, { "epoch": 0.55, "learning_rate": 1.877504881346455e-05, "loss": 0.4984, "step": 2991 }, { "epoch": 0.55, "learning_rate": 1.8774090724901177e-05, "loss": 0.4826, "step": 2992 }, { "epoch": 0.55, "learning_rate": 1.877313228626783e-05, "loss": 0.4761, "step": 2993 }, { "epoch": 0.55, "learning_rate": 1.8772173497602748e-05, "loss": 0.4719, "step": 2994 }, { "epoch": 0.55, "learning_rate": 1.8771214358944183e-05, "loss": 0.4861, "step": 2995 }, { "epoch": 0.55, "learning_rate": 1.8770254870330405e-05, "loss": 0.4665, "step": 2996 }, { "epoch": 0.55, "learning_rate": 1.87692950317997e-05, "loss": 0.4891, "step": 2997 }, { "epoch": 0.55, "learning_rate": 1.876833484339035e-05, "loss": 0.4707, "step": 2998 }, { "epoch": 0.55, "learning_rate": 1.8767374305140683e-05, "loss": 0.4792, "step": 2999 }, { "epoch": 0.56, "learning_rate": 1.8766413417089007e-05, "loss": 0.4712, "step": 3000 }, { "epoch": 0.56, "learning_rate": 1.876545217927367e-05, "loss": 0.4701, "step": 3001 }, { "epoch": 0.56, "learning_rate": 1.876449059173302e-05, "loss": 0.4668, "step": 3002 }, { "epoch": 0.56, "learning_rate": 1.876352865450542e-05, "loss": 0.4803, "step": 3003 }, { "epoch": 0.56, "learning_rate": 1.8762566367629253e-05, "loss": 0.4756, "step": 3004 }, { "epoch": 0.56, "learning_rate": 1.876160373114291e-05, "loss": 0.467, "step": 3005 }, { "epoch": 0.56, "learning_rate": 1.87606407450848e-05, "loss": 0.4859, "step": 3006 }, { "epoch": 0.56, "learning_rate": 1.8759677409493345e-05, "loss": 0.4994, "step": 3007 }, { "epoch": 0.56, "learning_rate": 1.8758713724406984e-05, "loss": 0.4828, "step": 3008 }, { "epoch": 0.56, "learning_rate": 1.8757749689864157e-05, "loss": 0.4502, "step": 3009 }, { "epoch": 0.56, "learning_rate": 1.8756785305903332e-05, "loss": 0.4831, "step": 3010 }, { "epoch": 0.56, "learning_rate": 1.8755820572562985e-05, "loss": 0.4631, "step": 3011 }, { "epoch": 0.56, "learning_rate": 1.8754855489881613e-05, "loss": 0.4907, "step": 3012 }, { "epoch": 0.56, "learning_rate": 1.8753890057897713e-05, "loss": 0.4828, "step": 3013 }, { "epoch": 0.56, "learning_rate": 1.8752924276649804e-05, "loss": 0.4839, "step": 3014 }, { "epoch": 0.56, "learning_rate": 1.8751958146176424e-05, "loss": 0.4748, "step": 3015 }, { "epoch": 0.56, "learning_rate": 1.8750991666516117e-05, "loss": 0.4728, "step": 3016 }, { "epoch": 0.56, "learning_rate": 1.8750024837707447e-05, "loss": 0.4915, "step": 3017 }, { "epoch": 0.56, "learning_rate": 1.8749057659788988e-05, "loss": 0.4791, "step": 3018 }, { "epoch": 0.56, "learning_rate": 1.8748090132799323e-05, "loss": 0.4728, "step": 3019 }, { "epoch": 0.56, "learning_rate": 1.8747122256777058e-05, "loss": 0.4657, "step": 3020 }, { "epoch": 0.56, "learning_rate": 1.8746154031760816e-05, "loss": 0.4696, "step": 3021 }, { "epoch": 0.56, "learning_rate": 1.8745185457789216e-05, "loss": 0.4774, "step": 3022 }, { "epoch": 0.56, "learning_rate": 1.8744216534900906e-05, "loss": 0.4813, "step": 3023 }, { "epoch": 0.56, "learning_rate": 1.8743247263134548e-05, "loss": 0.4771, "step": 3024 }, { "epoch": 0.56, "learning_rate": 1.874227764252881e-05, "loss": 0.4823, "step": 3025 }, { "epoch": 0.56, "learning_rate": 1.8741307673122384e-05, "loss": 0.4592, "step": 3026 }, { "epoch": 0.56, "learning_rate": 1.8740337354953963e-05, "loss": 0.4818, "step": 3027 }, { "epoch": 0.56, "learning_rate": 1.8739366688062264e-05, "loss": 0.4616, "step": 3028 }, { "epoch": 0.56, "learning_rate": 1.8738395672486016e-05, "loss": 0.4636, "step": 3029 }, { "epoch": 0.56, "learning_rate": 1.873742430826396e-05, "loss": 0.4954, "step": 3030 }, { "epoch": 0.56, "learning_rate": 1.873645259543485e-05, "loss": 0.4701, "step": 3031 }, { "epoch": 0.56, "learning_rate": 1.8735480534037454e-05, "loss": 0.4824, "step": 3032 }, { "epoch": 0.56, "learning_rate": 1.873450812411056e-05, "loss": 0.4756, "step": 3033 }, { "epoch": 0.56, "learning_rate": 1.873353536569296e-05, "loss": 0.4589, "step": 3034 }, { "epoch": 0.56, "learning_rate": 1.8732562258823477e-05, "loss": 0.4612, "step": 3035 }, { "epoch": 0.56, "learning_rate": 1.873158880354092e-05, "loss": 0.4879, "step": 3036 }, { "epoch": 0.56, "learning_rate": 1.873061499988414e-05, "loss": 0.469, "step": 3037 }, { "epoch": 0.56, "learning_rate": 1.8729640847891985e-05, "loss": 0.4767, "step": 3038 }, { "epoch": 0.56, "learning_rate": 1.872866634760332e-05, "loss": 0.4694, "step": 3039 }, { "epoch": 0.56, "learning_rate": 1.8727691499057032e-05, "loss": 0.4698, "step": 3040 }, { "epoch": 0.56, "learning_rate": 1.872671630229201e-05, "loss": 0.4735, "step": 3041 }, { "epoch": 0.56, "learning_rate": 1.8725740757347166e-05, "loss": 0.4856, "step": 3042 }, { "epoch": 0.56, "learning_rate": 1.872476486426142e-05, "loss": 0.4768, "step": 3043 }, { "epoch": 0.56, "learning_rate": 1.8723788623073708e-05, "loss": 0.4736, "step": 3044 }, { "epoch": 0.56, "learning_rate": 1.8722812033822987e-05, "loss": 0.4806, "step": 3045 }, { "epoch": 0.56, "learning_rate": 1.872183509654821e-05, "loss": 0.4659, "step": 3046 }, { "epoch": 0.56, "learning_rate": 1.872085781128836e-05, "loss": 0.478, "step": 3047 }, { "epoch": 0.56, "learning_rate": 1.8719880178082435e-05, "loss": 0.4723, "step": 3048 }, { "epoch": 0.56, "learning_rate": 1.871890219696943e-05, "loss": 0.4667, "step": 3049 }, { "epoch": 0.56, "learning_rate": 1.871792386798838e-05, "loss": 0.488, "step": 3050 }, { "epoch": 0.56, "learning_rate": 1.8716945191178297e-05, "loss": 0.4868, "step": 3051 }, { "epoch": 0.56, "learning_rate": 1.8715966166578243e-05, "loss": 0.4852, "step": 3052 }, { "epoch": 0.56, "learning_rate": 1.8714986794227278e-05, "loss": 0.4907, "step": 3053 }, { "epoch": 0.57, "learning_rate": 1.8714007074164473e-05, "loss": 0.4701, "step": 3054 }, { "epoch": 0.57, "learning_rate": 1.871302700642892e-05, "loss": 0.4689, "step": 3055 }, { "epoch": 0.57, "learning_rate": 1.871204659105972e-05, "loss": 0.4668, "step": 3056 }, { "epoch": 0.57, "learning_rate": 1.8711065828095996e-05, "loss": 0.4729, "step": 3057 }, { "epoch": 0.57, "learning_rate": 1.8710084717576872e-05, "loss": 0.4701, "step": 3058 }, { "epoch": 0.57, "learning_rate": 1.870910325954149e-05, "loss": 0.4573, "step": 3059 }, { "epoch": 0.57, "learning_rate": 1.8708121454029015e-05, "loss": 0.4797, "step": 3060 }, { "epoch": 0.57, "learning_rate": 1.870713930107862e-05, "loss": 0.458, "step": 3061 }, { "epoch": 0.57, "learning_rate": 1.870615680072948e-05, "loss": 0.4928, "step": 3062 }, { "epoch": 0.57, "learning_rate": 1.870517395302081e-05, "loss": 0.4729, "step": 3063 }, { "epoch": 0.57, "learning_rate": 1.8704190757991813e-05, "loss": 0.4704, "step": 3064 }, { "epoch": 0.57, "learning_rate": 1.870320721568172e-05, "loss": 0.4679, "step": 3065 }, { "epoch": 0.57, "learning_rate": 1.870222332612977e-05, "loss": 0.4812, "step": 3066 }, { "epoch": 0.57, "learning_rate": 1.8701239089375227e-05, "loss": 0.4947, "step": 3067 }, { "epoch": 0.57, "learning_rate": 1.8700254505457352e-05, "loss": 0.482, "step": 3068 }, { "epoch": 0.57, "learning_rate": 1.8699269574415428e-05, "loss": 0.473, "step": 3069 }, { "epoch": 0.57, "learning_rate": 1.8698284296288757e-05, "loss": 0.4818, "step": 3070 }, { "epoch": 0.57, "learning_rate": 1.8697298671116645e-05, "loss": 0.4833, "step": 3071 }, { "epoch": 0.57, "learning_rate": 1.869631269893842e-05, "loss": 0.481, "step": 3072 }, { "epoch": 0.57, "learning_rate": 1.869532637979342e-05, "loss": 0.4874, "step": 3073 }, { "epoch": 0.57, "learning_rate": 1.869433971372099e-05, "loss": 0.4652, "step": 3074 }, { "epoch": 0.57, "learning_rate": 1.8693352700760513e-05, "loss": 0.4862, "step": 3075 }, { "epoch": 0.57, "learning_rate": 1.8692365340951353e-05, "loss": 0.4771, "step": 3076 }, { "epoch": 0.57, "learning_rate": 1.8691377634332907e-05, "loss": 0.4689, "step": 3077 }, { "epoch": 0.57, "learning_rate": 1.8690389580944587e-05, "loss": 0.4857, "step": 3078 }, { "epoch": 0.57, "learning_rate": 1.8689401180825814e-05, "loss": 0.4806, "step": 3079 }, { "epoch": 0.57, "learning_rate": 1.8688412434016025e-05, "loss": 0.4853, "step": 3080 }, { "epoch": 0.57, "learning_rate": 1.8687423340554658e-05, "loss": 0.4824, "step": 3081 }, { "epoch": 0.57, "learning_rate": 1.868643390048119e-05, "loss": 0.4959, "step": 3082 }, { "epoch": 0.57, "learning_rate": 1.8685444113835088e-05, "loss": 0.4693, "step": 3083 }, { "epoch": 0.57, "learning_rate": 1.868445398065585e-05, "loss": 0.4924, "step": 3084 }, { "epoch": 0.57, "learning_rate": 1.8683463500982973e-05, "loss": 0.4885, "step": 3085 }, { "epoch": 0.57, "learning_rate": 1.8682472674855984e-05, "loss": 0.4717, "step": 3086 }, { "epoch": 0.57, "learning_rate": 1.868148150231441e-05, "loss": 0.4882, "step": 3087 }, { "epoch": 0.57, "learning_rate": 1.8680489983397793e-05, "loss": 0.4585, "step": 3088 }, { "epoch": 0.57, "learning_rate": 1.86794981181457e-05, "loss": 0.4841, "step": 3089 }, { "epoch": 0.57, "learning_rate": 1.8678505906597705e-05, "loss": 0.4839, "step": 3090 }, { "epoch": 0.57, "learning_rate": 1.867751334879339e-05, "loss": 0.4733, "step": 3091 }, { "epoch": 0.57, "learning_rate": 1.8676520444772353e-05, "loss": 0.4774, "step": 3092 }, { "epoch": 0.57, "learning_rate": 1.867552719457422e-05, "loss": 0.497, "step": 3093 }, { "epoch": 0.57, "learning_rate": 1.8674533598238614e-05, "loss": 0.4672, "step": 3094 }, { "epoch": 0.57, "learning_rate": 1.8673539655805176e-05, "loss": 0.4838, "step": 3095 }, { "epoch": 0.57, "learning_rate": 1.8672545367313565e-05, "loss": 0.4556, "step": 3096 }, { "epoch": 0.57, "learning_rate": 1.867155073280345e-05, "loss": 0.4805, "step": 3097 }, { "epoch": 0.57, "learning_rate": 1.8670555752314515e-05, "loss": 0.461, "step": 3098 }, { "epoch": 0.57, "learning_rate": 1.866956042588646e-05, "loss": 0.4614, "step": 3099 }, { "epoch": 0.57, "learning_rate": 1.8668564753558997e-05, "loss": 0.4756, "step": 3100 }, { "epoch": 0.57, "learning_rate": 1.866756873537185e-05, "loss": 0.481, "step": 3101 }, { "epoch": 0.57, "learning_rate": 1.8666572371364755e-05, "loss": 0.4825, "step": 3102 }, { "epoch": 0.57, "learning_rate": 1.866557566157747e-05, "loss": 0.4723, "step": 3103 }, { "epoch": 0.57, "learning_rate": 1.866457860604976e-05, "loss": 0.4661, "step": 3104 }, { "epoch": 0.57, "learning_rate": 1.8663581204821403e-05, "loss": 0.4746, "step": 3105 }, { "epoch": 0.57, "learning_rate": 1.8662583457932198e-05, "loss": 0.4938, "step": 3106 }, { "epoch": 0.57, "learning_rate": 1.8661585365421953e-05, "loss": 0.4871, "step": 3107 }, { "epoch": 0.58, "learning_rate": 1.8660586927330485e-05, "loss": 0.4619, "step": 3108 }, { "epoch": 0.58, "learning_rate": 1.8659588143697636e-05, "loss": 0.4726, "step": 3109 }, { "epoch": 0.58, "learning_rate": 1.8658589014563252e-05, "loss": 0.448, "step": 3110 }, { "epoch": 0.58, "learning_rate": 1.8657589539967196e-05, "loss": 0.4611, "step": 3111 }, { "epoch": 0.58, "learning_rate": 1.865658971994935e-05, "loss": 0.4865, "step": 3112 }, { "epoch": 0.58, "learning_rate": 1.86555895545496e-05, "loss": 0.4581, "step": 3113 }, { "epoch": 0.58, "learning_rate": 1.865458904380785e-05, "loss": 0.4766, "step": 3114 }, { "epoch": 0.58, "learning_rate": 1.865358818776402e-05, "loss": 0.4529, "step": 3115 }, { "epoch": 0.58, "learning_rate": 1.8652586986458043e-05, "loss": 0.4723, "step": 3116 }, { "epoch": 0.58, "learning_rate": 1.865158543992987e-05, "loss": 0.4593, "step": 3117 }, { "epoch": 0.58, "learning_rate": 1.8650583548219453e-05, "loss": 0.4878, "step": 3118 }, { "epoch": 0.58, "learning_rate": 1.864958131136677e-05, "loss": 0.4622, "step": 3119 }, { "epoch": 0.58, "learning_rate": 1.86485787294118e-05, "loss": 0.4711, "step": 3120 }, { "epoch": 0.58, "learning_rate": 1.864757580239456e-05, "loss": 0.458, "step": 3121 }, { "epoch": 0.58, "learning_rate": 1.8646572530355055e-05, "loss": 0.4489, "step": 3122 }, { "epoch": 0.58, "learning_rate": 1.864556891333331e-05, "loss": 0.4728, "step": 3123 }, { "epoch": 0.58, "learning_rate": 1.8644564951369374e-05, "loss": 0.4984, "step": 3124 }, { "epoch": 0.58, "learning_rate": 1.8643560644503303e-05, "loss": 0.4784, "step": 3125 }, { "epoch": 0.58, "learning_rate": 1.864255599277516e-05, "loss": 0.4756, "step": 3126 }, { "epoch": 0.58, "learning_rate": 1.8641550996225042e-05, "loss": 0.4889, "step": 3127 }, { "epoch": 0.58, "learning_rate": 1.8640545654893036e-05, "loss": 0.4733, "step": 3128 }, { "epoch": 0.58, "learning_rate": 1.8639539968819253e-05, "loss": 0.4722, "step": 3129 }, { "epoch": 0.58, "learning_rate": 1.8638533938043823e-05, "loss": 0.4843, "step": 3130 }, { "epoch": 0.58, "learning_rate": 1.8637527562606883e-05, "loss": 0.4828, "step": 3131 }, { "epoch": 0.58, "learning_rate": 1.8636520842548584e-05, "loss": 0.4664, "step": 3132 }, { "epoch": 0.58, "learning_rate": 1.8635513777909096e-05, "loss": 0.4679, "step": 3133 }, { "epoch": 0.58, "learning_rate": 1.8634506368728596e-05, "loss": 0.4787, "step": 3134 }, { "epoch": 0.58, "learning_rate": 1.8633498615047277e-05, "loss": 0.4597, "step": 3135 }, { "epoch": 0.58, "learning_rate": 1.8632490516905347e-05, "loss": 0.4603, "step": 3136 }, { "epoch": 0.58, "learning_rate": 1.863148207434303e-05, "loss": 0.4743, "step": 3137 }, { "epoch": 0.58, "learning_rate": 1.8630473287400556e-05, "loss": 0.4697, "step": 3138 }, { "epoch": 0.58, "learning_rate": 1.862946415611818e-05, "loss": 0.4736, "step": 3139 }, { "epoch": 0.58, "learning_rate": 1.862845468053616e-05, "loss": 0.4802, "step": 3140 }, { "epoch": 0.58, "learning_rate": 1.8627444860694773e-05, "loss": 0.4685, "step": 3141 }, { "epoch": 0.58, "learning_rate": 1.8626434696634307e-05, "loss": 0.4684, "step": 3142 }, { "epoch": 0.58, "learning_rate": 1.862542418839507e-05, "loss": 0.4923, "step": 3143 }, { "epoch": 0.58, "learning_rate": 1.862441333601738e-05, "loss": 0.4687, "step": 3144 }, { "epoch": 0.58, "learning_rate": 1.8623402139541564e-05, "loss": 0.4853, "step": 3145 }, { "epoch": 0.58, "learning_rate": 1.8622390599007967e-05, "loss": 0.4683, "step": 3146 }, { "epoch": 0.58, "learning_rate": 1.862137871445695e-05, "loss": 0.4762, "step": 3147 }, { "epoch": 0.58, "learning_rate": 1.8620366485928886e-05, "loss": 0.4724, "step": 3148 }, { "epoch": 0.58, "learning_rate": 1.8619353913464157e-05, "loss": 0.457, "step": 3149 }, { "epoch": 0.58, "learning_rate": 1.8618340997103167e-05, "loss": 0.4663, "step": 3150 }, { "epoch": 0.58, "learning_rate": 1.8617327736886327e-05, "loss": 0.4636, "step": 3151 }, { "epoch": 0.58, "learning_rate": 1.8616314132854067e-05, "loss": 0.474, "step": 3152 }, { "epoch": 0.58, "learning_rate": 1.861530018504682e-05, "loss": 0.5112, "step": 3153 }, { "epoch": 0.58, "learning_rate": 1.8614285893505052e-05, "loss": 0.4957, "step": 3154 }, { "epoch": 0.58, "learning_rate": 1.861327125826922e-05, "loss": 0.4625, "step": 3155 }, { "epoch": 0.58, "learning_rate": 1.8612256279379815e-05, "loss": 0.4872, "step": 3156 }, { "epoch": 0.58, "learning_rate": 1.8611240956877334e-05, "loss": 0.4698, "step": 3157 }, { "epoch": 0.58, "learning_rate": 1.8610225290802276e-05, "loss": 0.4797, "step": 3158 }, { "epoch": 0.58, "learning_rate": 1.860920928119517e-05, "loss": 0.4544, "step": 3159 }, { "epoch": 0.58, "learning_rate": 1.8608192928096556e-05, "loss": 0.4809, "step": 3160 }, { "epoch": 0.58, "learning_rate": 1.8607176231546984e-05, "loss": 0.46, "step": 3161 }, { "epoch": 0.59, "learning_rate": 1.860615919158701e-05, "loss": 0.4691, "step": 3162 }, { "epoch": 0.59, "learning_rate": 1.8605141808257224e-05, "loss": 0.4584, "step": 3163 }, { "epoch": 0.59, "learning_rate": 1.860412408159821e-05, "loss": 0.4867, "step": 3164 }, { "epoch": 0.59, "learning_rate": 1.8603106011650574e-05, "loss": 0.5018, "step": 3165 }, { "epoch": 0.59, "learning_rate": 1.8602087598454937e-05, "loss": 0.4716, "step": 3166 }, { "epoch": 0.59, "learning_rate": 1.8601068842051932e-05, "loss": 0.4786, "step": 3167 }, { "epoch": 0.59, "learning_rate": 1.8600049742482202e-05, "loss": 0.4763, "step": 3168 }, { "epoch": 0.59, "learning_rate": 1.859903029978641e-05, "loss": 0.4767, "step": 3169 }, { "epoch": 0.59, "learning_rate": 1.8598010514005235e-05, "loss": 0.4683, "step": 3170 }, { "epoch": 0.59, "learning_rate": 1.8596990385179353e-05, "loss": 0.4939, "step": 3171 }, { "epoch": 0.59, "learning_rate": 1.8595969913349476e-05, "loss": 0.4937, "step": 3172 }, { "epoch": 0.59, "learning_rate": 1.8594949098556313e-05, "loss": 0.4442, "step": 3173 }, { "epoch": 0.59, "learning_rate": 1.859392794084059e-05, "loss": 0.4852, "step": 3174 }, { "epoch": 0.59, "learning_rate": 1.8592906440243063e-05, "loss": 0.4607, "step": 3175 }, { "epoch": 0.59, "learning_rate": 1.859188459680447e-05, "loss": 0.4567, "step": 3176 }, { "epoch": 0.59, "learning_rate": 1.8590862410565592e-05, "loss": 0.4655, "step": 3177 }, { "epoch": 0.59, "learning_rate": 1.858983988156721e-05, "loss": 0.4664, "step": 3178 }, { "epoch": 0.59, "learning_rate": 1.8588817009850116e-05, "loss": 0.4746, "step": 3179 }, { "epoch": 0.59, "learning_rate": 1.8587793795455132e-05, "loss": 0.4824, "step": 3180 }, { "epoch": 0.59, "learning_rate": 1.8586770238423072e-05, "loss": 0.5019, "step": 3181 }, { "epoch": 0.59, "learning_rate": 1.8585746338794774e-05, "loss": 0.4996, "step": 3182 }, { "epoch": 0.59, "learning_rate": 1.85847220966111e-05, "loss": 0.4725, "step": 3183 }, { "epoch": 0.59, "learning_rate": 1.8583697511912905e-05, "loss": 0.5028, "step": 3184 }, { "epoch": 0.59, "learning_rate": 1.858267258474107e-05, "loss": 0.4566, "step": 3185 }, { "epoch": 0.59, "learning_rate": 1.8581647315136494e-05, "loss": 0.4574, "step": 3186 }, { "epoch": 0.59, "learning_rate": 1.8580621703140075e-05, "loss": 0.4756, "step": 3187 }, { "epoch": 0.59, "learning_rate": 1.8579595748792735e-05, "loss": 0.4509, "step": 3188 }, { "epoch": 0.59, "learning_rate": 1.8578569452135413e-05, "loss": 0.4866, "step": 3189 }, { "epoch": 0.59, "learning_rate": 1.857754281320905e-05, "loss": 0.466, "step": 3190 }, { "epoch": 0.59, "learning_rate": 1.857651583205461e-05, "loss": 0.472, "step": 3191 }, { "epoch": 0.59, "learning_rate": 1.857548850871307e-05, "loss": 0.4664, "step": 3192 }, { "epoch": 0.59, "learning_rate": 1.8574460843225413e-05, "loss": 0.4905, "step": 3193 }, { "epoch": 0.59, "learning_rate": 1.8573432835632644e-05, "loss": 0.4624, "step": 3194 }, { "epoch": 0.59, "learning_rate": 1.8572404485975778e-05, "loss": 0.4803, "step": 3195 }, { "epoch": 0.59, "learning_rate": 1.8571375794295844e-05, "loss": 0.4581, "step": 3196 }, { "epoch": 0.59, "learning_rate": 1.8570346760633886e-05, "loss": 0.4798, "step": 3197 }, { "epoch": 0.59, "learning_rate": 1.856931738503096e-05, "loss": 0.4568, "step": 3198 }, { "epoch": 0.59, "learning_rate": 1.8568287667528137e-05, "loss": 0.4705, "step": 3199 }, { "epoch": 0.59, "learning_rate": 1.85672576081665e-05, "loss": 0.4711, "step": 3200 }, { "epoch": 0.59, "learning_rate": 1.8566227206987143e-05, "loss": 0.447, "step": 3201 }, { "epoch": 0.59, "learning_rate": 1.8565196464031183e-05, "loss": 0.4726, "step": 3202 }, { "epoch": 0.59, "learning_rate": 1.8564165379339743e-05, "loss": 0.4798, "step": 3203 }, { "epoch": 0.59, "learning_rate": 1.856313395295396e-05, "loss": 0.4688, "step": 3204 }, { "epoch": 0.59, "learning_rate": 1.8562102184914982e-05, "loss": 0.4755, "step": 3205 }, { "epoch": 0.59, "learning_rate": 1.8561070075263985e-05, "loss": 0.4943, "step": 3206 }, { "epoch": 0.59, "learning_rate": 1.856003762404214e-05, "loss": 0.4865, "step": 3207 }, { "epoch": 0.59, "learning_rate": 1.855900483129064e-05, "loss": 0.4948, "step": 3208 }, { "epoch": 0.59, "learning_rate": 1.8557971697050695e-05, "loss": 0.4774, "step": 3209 }, { "epoch": 0.59, "learning_rate": 1.855693822136353e-05, "loss": 0.4777, "step": 3210 }, { "epoch": 0.59, "learning_rate": 1.8555904404270368e-05, "loss": 0.4524, "step": 3211 }, { "epoch": 0.59, "learning_rate": 1.8554870245812457e-05, "loss": 0.4677, "step": 3212 }, { "epoch": 0.59, "learning_rate": 1.855383574603107e-05, "loss": 0.4635, "step": 3213 }, { "epoch": 0.59, "learning_rate": 1.8552800904967466e-05, "loss": 0.4617, "step": 3214 }, { "epoch": 0.59, "learning_rate": 1.8551765722662946e-05, "loss": 0.4504, "step": 3215 }, { "epoch": 0.6, "learning_rate": 1.8550730199158805e-05, "loss": 0.4738, "step": 3216 }, { "epoch": 0.6, "learning_rate": 1.8549694334496363e-05, "loss": 0.4858, "step": 3217 }, { "epoch": 0.6, "learning_rate": 1.8548658128716942e-05, "loss": 0.4773, "step": 3218 }, { "epoch": 0.6, "learning_rate": 1.8547621581861893e-05, "loss": 0.4752, "step": 3219 }, { "epoch": 0.6, "learning_rate": 1.8546584693972565e-05, "loss": 0.4717, "step": 3220 }, { "epoch": 0.6, "learning_rate": 1.8545547465090334e-05, "loss": 0.4646, "step": 3221 }, { "epoch": 0.6, "learning_rate": 1.854450989525658e-05, "loss": 0.488, "step": 3222 }, { "epoch": 0.6, "learning_rate": 1.85434719845127e-05, "loss": 0.4849, "step": 3223 }, { "epoch": 0.6, "learning_rate": 1.854243373290011e-05, "loss": 0.4716, "step": 3224 }, { "epoch": 0.6, "learning_rate": 1.8541395140460222e-05, "loss": 0.4488, "step": 3225 }, { "epoch": 0.6, "learning_rate": 1.854035620723449e-05, "loss": 0.461, "step": 3226 }, { "epoch": 0.6, "learning_rate": 1.853931693326435e-05, "loss": 0.4758, "step": 3227 }, { "epoch": 0.6, "learning_rate": 1.853827731859128e-05, "loss": 0.476, "step": 3228 }, { "epoch": 0.6, "learning_rate": 1.853723736325675e-05, "loss": 0.4704, "step": 3229 }, { "epoch": 0.6, "learning_rate": 1.853619706730226e-05, "loss": 0.445, "step": 3230 }, { "epoch": 0.6, "learning_rate": 1.8535156430769306e-05, "loss": 0.4608, "step": 3231 }, { "epoch": 0.6, "learning_rate": 1.8534115453699416e-05, "loss": 0.465, "step": 3232 }, { "epoch": 0.6, "learning_rate": 1.8533074136134118e-05, "loss": 0.4784, "step": 3233 }, { "epoch": 0.6, "learning_rate": 1.853203247811496e-05, "loss": 0.4819, "step": 3234 }, { "epoch": 0.6, "learning_rate": 1.8530990479683505e-05, "loss": 0.4527, "step": 3235 }, { "epoch": 0.6, "learning_rate": 1.8529948140881323e-05, "loss": 0.4603, "step": 3236 }, { "epoch": 0.6, "learning_rate": 1.8528905461750004e-05, "loss": 0.4763, "step": 3237 }, { "epoch": 0.6, "learning_rate": 1.8527862442331148e-05, "loss": 0.471, "step": 3238 }, { "epoch": 0.6, "learning_rate": 1.852681908266637e-05, "loss": 0.4541, "step": 3239 }, { "epoch": 0.6, "learning_rate": 1.8525775382797296e-05, "loss": 0.4733, "step": 3240 }, { "epoch": 0.6, "learning_rate": 1.852473134276557e-05, "loss": 0.4974, "step": 3241 }, { "epoch": 0.6, "learning_rate": 1.8523686962612845e-05, "loss": 0.4756, "step": 3242 }, { "epoch": 0.6, "learning_rate": 1.852264224238079e-05, "loss": 0.5023, "step": 3243 }, { "epoch": 0.6, "learning_rate": 1.85215971821111e-05, "loss": 0.4766, "step": 3244 }, { "epoch": 0.6, "learning_rate": 1.8520551781845447e-05, "loss": 0.4562, "step": 3245 }, { "epoch": 0.6, "learning_rate": 1.8519506041625558e-05, "loss": 0.4724, "step": 3246 }, { "epoch": 0.6, "learning_rate": 1.851845996149315e-05, "loss": 0.4641, "step": 3247 }, { "epoch": 0.6, "learning_rate": 1.8517413541489964e-05, "loss": 0.4576, "step": 3248 }, { "epoch": 0.6, "learning_rate": 1.8516366781657743e-05, "loss": 0.4661, "step": 3249 }, { "epoch": 0.6, "learning_rate": 1.851531968203826e-05, "loss": 0.4812, "step": 3250 }, { "epoch": 0.6, "learning_rate": 1.8514272242673286e-05, "loss": 0.461, "step": 3251 }, { "epoch": 0.6, "learning_rate": 1.8513224463604608e-05, "loss": 0.4589, "step": 3252 }, { "epoch": 0.6, "learning_rate": 1.851217634487404e-05, "loss": 0.471, "step": 3253 }, { "epoch": 0.6, "learning_rate": 1.8511127886523395e-05, "loss": 0.462, "step": 3254 }, { "epoch": 0.6, "learning_rate": 1.8510079088594507e-05, "loss": 0.4835, "step": 3255 }, { "epoch": 0.6, "learning_rate": 1.850902995112922e-05, "loss": 0.4914, "step": 3256 }, { "epoch": 0.6, "learning_rate": 1.8507980474169388e-05, "loss": 0.465, "step": 3257 }, { "epoch": 0.6, "learning_rate": 1.8506930657756892e-05, "loss": 0.4721, "step": 3258 }, { "epoch": 0.6, "learning_rate": 1.850588050193361e-05, "loss": 0.4581, "step": 3259 }, { "epoch": 0.6, "learning_rate": 1.8504830006741442e-05, "loss": 0.4558, "step": 3260 }, { "epoch": 0.6, "learning_rate": 1.8503779172222306e-05, "loss": 0.4636, "step": 3261 }, { "epoch": 0.6, "learning_rate": 1.8502727998418123e-05, "loss": 0.4892, "step": 3262 }, { "epoch": 0.6, "learning_rate": 1.850167648537084e-05, "loss": 0.4315, "step": 3263 }, { "epoch": 0.6, "learning_rate": 1.8500624633122402e-05, "loss": 0.4675, "step": 3264 }, { "epoch": 0.6, "learning_rate": 1.849957244171478e-05, "loss": 0.4855, "step": 3265 }, { "epoch": 0.6, "learning_rate": 1.8498519911189955e-05, "loss": 0.4858, "step": 3266 }, { "epoch": 0.6, "learning_rate": 1.8497467041589917e-05, "loss": 0.481, "step": 3267 }, { "epoch": 0.6, "learning_rate": 1.849641383295668e-05, "loss": 0.4712, "step": 3268 }, { "epoch": 0.6, "learning_rate": 1.8495360285332264e-05, "loss": 0.4961, "step": 3269 }, { "epoch": 0.6, "learning_rate": 1.8494306398758697e-05, "loss": 0.463, "step": 3270 }, { "epoch": 0.61, "learning_rate": 1.8493252173278035e-05, "loss": 0.4595, "step": 3271 }, { "epoch": 0.61, "learning_rate": 1.8492197608932332e-05, "loss": 0.4763, "step": 3272 }, { "epoch": 0.61, "learning_rate": 1.849114270576367e-05, "loss": 0.4669, "step": 3273 }, { "epoch": 0.61, "learning_rate": 1.8490087463814133e-05, "loss": 0.4938, "step": 3274 }, { "epoch": 0.61, "learning_rate": 1.8489031883125824e-05, "loss": 0.4839, "step": 3275 }, { "epoch": 0.61, "learning_rate": 1.8487975963740865e-05, "loss": 0.4661, "step": 3276 }, { "epoch": 0.61, "learning_rate": 1.848691970570138e-05, "loss": 0.4585, "step": 3277 }, { "epoch": 0.61, "learning_rate": 1.8485863109049506e-05, "loss": 0.4959, "step": 3278 }, { "epoch": 0.61, "learning_rate": 1.848480617382741e-05, "loss": 0.4675, "step": 3279 }, { "epoch": 0.61, "learning_rate": 1.8483748900077252e-05, "loss": 0.4531, "step": 3280 }, { "epoch": 0.61, "learning_rate": 1.8482691287841227e-05, "loss": 0.4661, "step": 3281 }, { "epoch": 0.61, "learning_rate": 1.848163333716152e-05, "loss": 0.4869, "step": 3282 }, { "epoch": 0.61, "learning_rate": 1.8480575048080347e-05, "loss": 0.4814, "step": 3283 }, { "epoch": 0.61, "learning_rate": 1.847951642063993e-05, "loss": 0.4547, "step": 3284 }, { "epoch": 0.61, "learning_rate": 1.847845745488251e-05, "loss": 0.4694, "step": 3285 }, { "epoch": 0.61, "learning_rate": 1.8477398150850332e-05, "loss": 0.4809, "step": 3286 }, { "epoch": 0.61, "learning_rate": 1.8476338508585668e-05, "loss": 0.442, "step": 3287 }, { "epoch": 0.61, "learning_rate": 1.8475278528130788e-05, "loss": 0.4806, "step": 3288 }, { "epoch": 0.61, "learning_rate": 1.8474218209527985e-05, "loss": 0.4679, "step": 3289 }, { "epoch": 0.61, "learning_rate": 1.8473157552819567e-05, "loss": 0.4594, "step": 3290 }, { "epoch": 0.61, "learning_rate": 1.8472096558047848e-05, "loss": 0.4662, "step": 3291 }, { "epoch": 0.61, "learning_rate": 1.8471035225255164e-05, "loss": 0.4555, "step": 3292 }, { "epoch": 0.61, "learning_rate": 1.8469973554483858e-05, "loss": 0.4908, "step": 3293 }, { "epoch": 0.61, "learning_rate": 1.846891154577629e-05, "loss": 0.4743, "step": 3294 }, { "epoch": 0.61, "learning_rate": 1.8467849199174827e-05, "loss": 0.4765, "step": 3295 }, { "epoch": 0.61, "learning_rate": 1.8466786514721863e-05, "loss": 0.463, "step": 3296 }, { "epoch": 0.61, "learning_rate": 1.846572349245979e-05, "loss": 0.4729, "step": 3297 }, { "epoch": 0.61, "learning_rate": 1.8464660132431026e-05, "loss": 0.4618, "step": 3298 }, { "epoch": 0.61, "learning_rate": 1.8463596434677992e-05, "loss": 0.4508, "step": 3299 }, { "epoch": 0.61, "learning_rate": 1.8462532399243134e-05, "loss": 0.4736, "step": 3300 }, { "epoch": 0.61, "learning_rate": 1.84614680261689e-05, "loss": 0.4561, "step": 3301 }, { "epoch": 0.61, "learning_rate": 1.8460403315497755e-05, "loss": 0.501, "step": 3302 }, { "epoch": 0.61, "learning_rate": 1.8459338267272185e-05, "loss": 0.4825, "step": 3303 }, { "epoch": 0.61, "learning_rate": 1.8458272881534675e-05, "loss": 0.4796, "step": 3304 }, { "epoch": 0.61, "learning_rate": 1.845720715832774e-05, "loss": 0.4773, "step": 3305 }, { "epoch": 0.61, "learning_rate": 1.84561410976939e-05, "loss": 0.4953, "step": 3306 }, { "epoch": 0.61, "learning_rate": 1.8455074699675687e-05, "loss": 0.464, "step": 3307 }, { "epoch": 0.61, "learning_rate": 1.8454007964315642e-05, "loss": 0.4725, "step": 3308 }, { "epoch": 0.61, "learning_rate": 1.8452940891656337e-05, "loss": 0.4595, "step": 3309 }, { "epoch": 0.61, "learning_rate": 1.8451873481740337e-05, "loss": 0.4715, "step": 3310 }, { "epoch": 0.61, "learning_rate": 1.8450805734610235e-05, "loss": 0.4822, "step": 3311 }, { "epoch": 0.61, "learning_rate": 1.844973765030863e-05, "loss": 0.4876, "step": 3312 }, { "epoch": 0.61, "learning_rate": 1.8448669228878135e-05, "loss": 0.4708, "step": 3313 }, { "epoch": 0.61, "learning_rate": 1.8447600470361383e-05, "loss": 0.4689, "step": 3314 }, { "epoch": 0.61, "learning_rate": 1.8446531374801012e-05, "loss": 0.4792, "step": 3315 }, { "epoch": 0.61, "learning_rate": 1.8445461942239676e-05, "loss": 0.4696, "step": 3316 }, { "epoch": 0.61, "learning_rate": 1.8444392172720044e-05, "loss": 0.4612, "step": 3317 }, { "epoch": 0.61, "learning_rate": 1.8443322066284804e-05, "loss": 0.4922, "step": 3318 }, { "epoch": 0.61, "learning_rate": 1.844225162297664e-05, "loss": 0.4769, "step": 3319 }, { "epoch": 0.61, "learning_rate": 1.844118084283827e-05, "loss": 0.4741, "step": 3320 }, { "epoch": 0.61, "learning_rate": 1.8440109725912414e-05, "loss": 0.4768, "step": 3321 }, { "epoch": 0.61, "learning_rate": 1.84390382722418e-05, "loss": 0.4554, "step": 3322 }, { "epoch": 0.61, "learning_rate": 1.8437966481869192e-05, "loss": 0.446, "step": 3323 }, { "epoch": 0.61, "learning_rate": 1.8436894354837338e-05, "loss": 0.451, "step": 3324 }, { "epoch": 0.62, "learning_rate": 1.843582189118902e-05, "loss": 0.4575, "step": 3325 }, { "epoch": 0.62, "learning_rate": 1.843474909096703e-05, "loss": 0.4452, "step": 3326 }, { "epoch": 0.62, "learning_rate": 1.8433675954214166e-05, "loss": 0.4753, "step": 3327 }, { "epoch": 0.62, "learning_rate": 1.8432602480973245e-05, "loss": 0.4828, "step": 3328 }, { "epoch": 0.62, "learning_rate": 1.84315286712871e-05, "loss": 0.4582, "step": 3329 }, { "epoch": 0.62, "learning_rate": 1.8430454525198567e-05, "loss": 0.4776, "step": 3330 }, { "epoch": 0.62, "learning_rate": 1.8429380042750514e-05, "loss": 0.484, "step": 3331 }, { "epoch": 0.62, "learning_rate": 1.84283052239858e-05, "loss": 0.4936, "step": 3332 }, { "epoch": 0.62, "learning_rate": 1.842723006894731e-05, "loss": 0.4575, "step": 3333 }, { "epoch": 0.62, "learning_rate": 1.8426154577677948e-05, "loss": 0.4561, "step": 3334 }, { "epoch": 0.62, "learning_rate": 1.8425078750220616e-05, "loss": 0.4887, "step": 3335 }, { "epoch": 0.62, "learning_rate": 1.8424002586618242e-05, "loss": 0.4807, "step": 3336 }, { "epoch": 0.62, "learning_rate": 1.8422926086913756e-05, "loss": 0.4711, "step": 3337 }, { "epoch": 0.62, "learning_rate": 1.842184925115012e-05, "loss": 0.4595, "step": 3338 }, { "epoch": 0.62, "learning_rate": 1.842077207937029e-05, "loss": 0.4592, "step": 3339 }, { "epoch": 0.62, "learning_rate": 1.8419694571617243e-05, "loss": 0.4557, "step": 3340 }, { "epoch": 0.62, "learning_rate": 1.8418616727933973e-05, "loss": 0.4756, "step": 3341 }, { "epoch": 0.62, "learning_rate": 1.8417538548363484e-05, "loss": 0.4556, "step": 3342 }, { "epoch": 0.62, "learning_rate": 1.8416460032948785e-05, "loss": 0.4755, "step": 3343 }, { "epoch": 0.62, "learning_rate": 1.841538118173292e-05, "loss": 0.4693, "step": 3344 }, { "epoch": 0.62, "learning_rate": 1.8414301994758922e-05, "loss": 0.4644, "step": 3345 }, { "epoch": 0.62, "learning_rate": 1.8413222472069858e-05, "loss": 0.4788, "step": 3346 }, { "epoch": 0.62, "learning_rate": 1.841214261370879e-05, "loss": 0.4864, "step": 3347 }, { "epoch": 0.62, "learning_rate": 1.8411062419718805e-05, "loss": 0.4811, "step": 3348 }, { "epoch": 0.62, "learning_rate": 1.8409981890143004e-05, "loss": 0.4469, "step": 3349 }, { "epoch": 0.62, "learning_rate": 1.8408901025024496e-05, "loss": 0.4903, "step": 3350 }, { "epoch": 0.62, "learning_rate": 1.840781982440641e-05, "loss": 0.4644, "step": 3351 }, { "epoch": 0.62, "learning_rate": 1.8406738288331874e-05, "loss": 0.4643, "step": 3352 }, { "epoch": 0.62, "learning_rate": 1.8405656416844048e-05, "loss": 0.4689, "step": 3353 }, { "epoch": 0.62, "learning_rate": 1.8404574209986094e-05, "loss": 0.456, "step": 3354 }, { "epoch": 0.62, "learning_rate": 1.840349166780119e-05, "loss": 0.4803, "step": 3355 }, { "epoch": 0.62, "learning_rate": 1.840240879033252e-05, "loss": 0.4738, "step": 3356 }, { "epoch": 0.62, "learning_rate": 1.8401325577623305e-05, "loss": 0.5031, "step": 3357 }, { "epoch": 0.62, "learning_rate": 1.840024202971675e-05, "loss": 0.4708, "step": 3358 }, { "epoch": 0.62, "learning_rate": 1.839915814665609e-05, "loss": 0.4792, "step": 3359 }, { "epoch": 0.62, "learning_rate": 1.8398073928484576e-05, "loss": 0.4827, "step": 3360 }, { "epoch": 0.62, "learning_rate": 1.8396989375245455e-05, "loss": 0.4565, "step": 3361 }, { "epoch": 0.62, "learning_rate": 1.8395904486982005e-05, "loss": 0.4972, "step": 3362 }, { "epoch": 0.62, "learning_rate": 1.8394819263737512e-05, "loss": 0.4711, "step": 3363 }, { "epoch": 0.62, "learning_rate": 1.8393733705555274e-05, "loss": 0.4739, "step": 3364 }, { "epoch": 0.62, "learning_rate": 1.83926478124786e-05, "loss": 0.4733, "step": 3365 }, { "epoch": 0.62, "learning_rate": 1.8391561584550815e-05, "loss": 0.4639, "step": 3366 }, { "epoch": 0.62, "learning_rate": 1.839047502181526e-05, "loss": 0.4736, "step": 3367 }, { "epoch": 0.62, "learning_rate": 1.838938812431529e-05, "loss": 0.4796, "step": 3368 }, { "epoch": 0.62, "learning_rate": 1.8388300892094265e-05, "loss": 0.477, "step": 3369 }, { "epoch": 0.62, "learning_rate": 1.8387213325195564e-05, "loss": 0.4494, "step": 3370 }, { "epoch": 0.62, "learning_rate": 1.838612542366258e-05, "loss": 0.4806, "step": 3371 }, { "epoch": 0.62, "learning_rate": 1.8385037187538718e-05, "loss": 0.4688, "step": 3372 }, { "epoch": 0.62, "learning_rate": 1.8383948616867397e-05, "loss": 0.4695, "step": 3373 }, { "epoch": 0.62, "learning_rate": 1.838285971169205e-05, "loss": 0.4738, "step": 3374 }, { "epoch": 0.62, "learning_rate": 1.838177047205612e-05, "loss": 0.4667, "step": 3375 }, { "epoch": 0.62, "learning_rate": 1.8380680898003064e-05, "loss": 0.4469, "step": 3376 }, { "epoch": 0.62, "learning_rate": 1.837959098957636e-05, "loss": 0.4615, "step": 3377 }, { "epoch": 0.62, "learning_rate": 1.8378500746819487e-05, "loss": 0.471, "step": 3378 }, { "epoch": 0.63, "learning_rate": 1.837741016977595e-05, "loss": 0.4505, "step": 3379 }, { "epoch": 0.63, "learning_rate": 1.8376319258489252e-05, "loss": 0.4685, "step": 3380 }, { "epoch": 0.63, "learning_rate": 1.8375228013002928e-05, "loss": 0.4649, "step": 3381 }, { "epoch": 0.63, "learning_rate": 1.8374136433360514e-05, "loss": 0.4865, "step": 3382 }, { "epoch": 0.63, "learning_rate": 1.8373044519605557e-05, "loss": 0.4459, "step": 3383 }, { "epoch": 0.63, "learning_rate": 1.837195227178163e-05, "loss": 0.4693, "step": 3384 }, { "epoch": 0.63, "learning_rate": 1.8370859689932305e-05, "loss": 0.4683, "step": 3385 }, { "epoch": 0.63, "learning_rate": 1.8369766774101176e-05, "loss": 0.4852, "step": 3386 }, { "epoch": 0.63, "learning_rate": 1.836867352433185e-05, "loss": 0.4706, "step": 3387 }, { "epoch": 0.63, "learning_rate": 1.8367579940667946e-05, "loss": 0.4767, "step": 3388 }, { "epoch": 0.63, "learning_rate": 1.8366486023153093e-05, "loss": 0.4528, "step": 3389 }, { "epoch": 0.63, "learning_rate": 1.8365391771830937e-05, "loss": 0.4764, "step": 3390 }, { "epoch": 0.63, "learning_rate": 1.836429718674514e-05, "loss": 0.4526, "step": 3391 }, { "epoch": 0.63, "learning_rate": 1.8363202267939367e-05, "loss": 0.4696, "step": 3392 }, { "epoch": 0.63, "learning_rate": 1.836210701545731e-05, "loss": 0.4674, "step": 3393 }, { "epoch": 0.63, "learning_rate": 1.8361011429342667e-05, "loss": 0.4338, "step": 3394 }, { "epoch": 0.63, "learning_rate": 1.8359915509639146e-05, "loss": 0.4814, "step": 3395 }, { "epoch": 0.63, "learning_rate": 1.8358819256390473e-05, "loss": 0.4446, "step": 3396 }, { "epoch": 0.63, "learning_rate": 1.835772266964039e-05, "loss": 0.4675, "step": 3397 }, { "epoch": 0.63, "learning_rate": 1.8356625749432642e-05, "loss": 0.4638, "step": 3398 }, { "epoch": 0.63, "learning_rate": 1.8355528495811007e-05, "loss": 0.4587, "step": 3399 }, { "epoch": 0.63, "learning_rate": 1.8354430908819248e-05, "loss": 0.4742, "step": 3400 }, { "epoch": 0.63, "learning_rate": 1.8353332988501165e-05, "loss": 0.4832, "step": 3401 }, { "epoch": 0.63, "learning_rate": 1.8352234734900564e-05, "loss": 0.4669, "step": 3402 }, { "epoch": 0.63, "learning_rate": 1.8351136148061254e-05, "loss": 0.4576, "step": 3403 }, { "epoch": 0.63, "learning_rate": 1.835003722802708e-05, "loss": 0.4759, "step": 3404 }, { "epoch": 0.63, "learning_rate": 1.834893797484188e-05, "loss": 0.4726, "step": 3405 }, { "epoch": 0.63, "learning_rate": 1.8347838388549508e-05, "loss": 0.4801, "step": 3406 }, { "epoch": 0.63, "learning_rate": 1.8346738469193842e-05, "loss": 0.4934, "step": 3407 }, { "epoch": 0.63, "learning_rate": 1.8345638216818767e-05, "loss": 0.4563, "step": 3408 }, { "epoch": 0.63, "learning_rate": 1.8344537631468176e-05, "loss": 0.5073, "step": 3409 }, { "epoch": 0.63, "learning_rate": 1.8343436713185983e-05, "loss": 0.4932, "step": 3410 }, { "epoch": 0.63, "learning_rate": 1.8342335462016115e-05, "loss": 0.4491, "step": 3411 }, { "epoch": 0.63, "learning_rate": 1.8341233878002508e-05, "loss": 0.4805, "step": 3412 }, { "epoch": 0.63, "learning_rate": 1.8340131961189108e-05, "loss": 0.4944, "step": 3413 }, { "epoch": 0.63, "learning_rate": 1.833902971161989e-05, "loss": 0.4619, "step": 3414 }, { "epoch": 0.63, "learning_rate": 1.833792712933882e-05, "loss": 0.4578, "step": 3415 }, { "epoch": 0.63, "learning_rate": 1.83368242143899e-05, "loss": 0.473, "step": 3416 }, { "epoch": 0.63, "learning_rate": 1.8335720966817124e-05, "loss": 0.4477, "step": 3417 }, { "epoch": 0.63, "learning_rate": 1.833461738666452e-05, "loss": 0.4718, "step": 3418 }, { "epoch": 0.63, "learning_rate": 1.833351347397611e-05, "loss": 0.4532, "step": 3419 }, { "epoch": 0.63, "learning_rate": 1.833240922879594e-05, "loss": 0.4846, "step": 3420 }, { "epoch": 0.63, "learning_rate": 1.833130465116807e-05, "loss": 0.4534, "step": 3421 }, { "epoch": 0.63, "learning_rate": 1.8330199741136573e-05, "loss": 0.4632, "step": 3422 }, { "epoch": 0.63, "learning_rate": 1.8329094498745523e-05, "loss": 0.4704, "step": 3423 }, { "epoch": 0.63, "learning_rate": 1.832798892403903e-05, "loss": 0.454, "step": 3424 }, { "epoch": 0.63, "learning_rate": 1.8326883017061194e-05, "loss": 0.4725, "step": 3425 }, { "epoch": 0.63, "learning_rate": 1.832577677785614e-05, "loss": 0.4674, "step": 3426 }, { "epoch": 0.63, "learning_rate": 1.8324670206468013e-05, "loss": 0.4752, "step": 3427 }, { "epoch": 0.63, "learning_rate": 1.8323563302940958e-05, "loss": 0.4633, "step": 3428 }, { "epoch": 0.63, "learning_rate": 1.8322456067319132e-05, "loss": 0.4529, "step": 3429 }, { "epoch": 0.63, "learning_rate": 1.832134849964672e-05, "loss": 0.4685, "step": 3430 }, { "epoch": 0.63, "learning_rate": 1.8320240599967908e-05, "loss": 0.4836, "step": 3431 }, { "epoch": 0.63, "learning_rate": 1.8319132368326903e-05, "loss": 0.4663, "step": 3432 }, { "epoch": 0.64, "learning_rate": 1.831802380476792e-05, "loss": 0.4605, "step": 3433 }, { "epoch": 0.64, "learning_rate": 1.8316914909335188e-05, "loss": 0.456, "step": 3434 }, { "epoch": 0.64, "learning_rate": 1.8315805682072944e-05, "loss": 0.4396, "step": 3435 }, { "epoch": 0.64, "learning_rate": 1.8314696123025456e-05, "loss": 0.4591, "step": 3436 }, { "epoch": 0.64, "learning_rate": 1.831358623223698e-05, "loss": 0.4985, "step": 3437 }, { "epoch": 0.64, "learning_rate": 1.831247600975181e-05, "loss": 0.4764, "step": 3438 }, { "epoch": 0.64, "learning_rate": 1.8311365455614238e-05, "loss": 0.4704, "step": 3439 }, { "epoch": 0.64, "learning_rate": 1.8310254569868572e-05, "loss": 0.4756, "step": 3440 }, { "epoch": 0.64, "learning_rate": 1.8309143352559133e-05, "loss": 0.4587, "step": 3441 }, { "epoch": 0.64, "learning_rate": 1.830803180373026e-05, "loss": 0.4617, "step": 3442 }, { "epoch": 0.64, "learning_rate": 1.8306919923426298e-05, "loss": 0.4838, "step": 3443 }, { "epoch": 0.64, "learning_rate": 1.8305807711691613e-05, "loss": 0.4714, "step": 3444 }, { "epoch": 0.64, "learning_rate": 1.8304695168570575e-05, "loss": 0.4595, "step": 3445 }, { "epoch": 0.64, "learning_rate": 1.830358229410758e-05, "loss": 0.4726, "step": 3446 }, { "epoch": 0.64, "learning_rate": 1.8302469088347022e-05, "loss": 0.4759, "step": 3447 }, { "epoch": 0.64, "learning_rate": 1.830135555133332e-05, "loss": 0.4455, "step": 3448 }, { "epoch": 0.64, "learning_rate": 1.83002416831109e-05, "loss": 0.4786, "step": 3449 }, { "epoch": 0.64, "learning_rate": 1.8299127483724205e-05, "loss": 0.4627, "step": 3450 }, { "epoch": 0.64, "learning_rate": 1.8298012953217688e-05, "loss": 0.4762, "step": 3451 }, { "epoch": 0.64, "learning_rate": 1.829689809163582e-05, "loss": 0.4781, "step": 3452 }, { "epoch": 0.64, "learning_rate": 1.8295782899023077e-05, "loss": 0.4818, "step": 3453 }, { "epoch": 0.64, "learning_rate": 1.8294667375423958e-05, "loss": 0.4716, "step": 3454 }, { "epoch": 0.64, "learning_rate": 1.8293551520882965e-05, "loss": 0.4654, "step": 3455 }, { "epoch": 0.64, "learning_rate": 1.8292435335444624e-05, "loss": 0.4798, "step": 3456 }, { "epoch": 0.64, "learning_rate": 1.8291318819153466e-05, "loss": 0.4812, "step": 3457 }, { "epoch": 0.64, "learning_rate": 1.8290201972054037e-05, "loss": 0.463, "step": 3458 }, { "epoch": 0.64, "learning_rate": 1.8289084794190895e-05, "loss": 0.4756, "step": 3459 }, { "epoch": 0.64, "learning_rate": 1.8287967285608622e-05, "loss": 0.4571, "step": 3460 }, { "epoch": 0.64, "learning_rate": 1.8286849446351794e-05, "loss": 0.4619, "step": 3461 }, { "epoch": 0.64, "learning_rate": 1.828573127646502e-05, "loss": 0.4761, "step": 3462 }, { "epoch": 0.64, "learning_rate": 1.8284612775992908e-05, "loss": 0.4322, "step": 3463 }, { "epoch": 0.64, "learning_rate": 1.8283493944980083e-05, "loss": 0.4769, "step": 3464 }, { "epoch": 0.64, "learning_rate": 1.8282374783471187e-05, "loss": 0.4374, "step": 3465 }, { "epoch": 0.64, "learning_rate": 1.8281255291510872e-05, "loss": 0.4817, "step": 3466 }, { "epoch": 0.64, "learning_rate": 1.8280135469143805e-05, "loss": 0.457, "step": 3467 }, { "epoch": 0.64, "learning_rate": 1.827901531641466e-05, "loss": 0.4857, "step": 3468 }, { "epoch": 0.64, "learning_rate": 1.827789483336813e-05, "loss": 0.4581, "step": 3469 }, { "epoch": 0.64, "learning_rate": 1.8276774020048927e-05, "loss": 0.4769, "step": 3470 }, { "epoch": 0.64, "learning_rate": 1.8275652876501763e-05, "loss": 0.4904, "step": 3471 }, { "epoch": 0.64, "learning_rate": 1.827453140277137e-05, "loss": 0.4771, "step": 3472 }, { "epoch": 0.64, "learning_rate": 1.8273409598902497e-05, "loss": 0.4675, "step": 3473 }, { "epoch": 0.64, "learning_rate": 1.8272287464939897e-05, "loss": 0.4827, "step": 3474 }, { "epoch": 0.64, "learning_rate": 1.827116500092834e-05, "loss": 0.4804, "step": 3475 }, { "epoch": 0.64, "learning_rate": 1.827004220691262e-05, "loss": 0.4621, "step": 3476 }, { "epoch": 0.64, "learning_rate": 1.826891908293752e-05, "loss": 0.4732, "step": 3477 }, { "epoch": 0.64, "learning_rate": 1.826779562904786e-05, "loss": 0.4568, "step": 3478 }, { "epoch": 0.64, "learning_rate": 1.8266671845288466e-05, "loss": 0.4794, "step": 3479 }, { "epoch": 0.64, "learning_rate": 1.826554773170417e-05, "loss": 0.4744, "step": 3480 }, { "epoch": 0.64, "learning_rate": 1.8264423288339818e-05, "loss": 0.4846, "step": 3481 }, { "epoch": 0.64, "learning_rate": 1.8263298515240282e-05, "loss": 0.4497, "step": 3482 }, { "epoch": 0.64, "learning_rate": 1.826217341245043e-05, "loss": 0.4577, "step": 3483 }, { "epoch": 0.64, "learning_rate": 1.826104798001516e-05, "loss": 0.4572, "step": 3484 }, { "epoch": 0.64, "learning_rate": 1.825992221797937e-05, "loss": 0.4767, "step": 3485 }, { "epoch": 0.64, "learning_rate": 1.8258796126387976e-05, "loss": 0.443, "step": 3486 }, { "epoch": 0.65, "learning_rate": 1.825766970528591e-05, "loss": 0.4471, "step": 3487 }, { "epoch": 0.65, "learning_rate": 1.8256542954718105e-05, "loss": 0.4746, "step": 3488 }, { "epoch": 0.65, "learning_rate": 1.8255415874729528e-05, "loss": 0.4943, "step": 3489 }, { "epoch": 0.65, "learning_rate": 1.825428846536514e-05, "loss": 0.471, "step": 3490 }, { "epoch": 0.65, "learning_rate": 1.8253160726669925e-05, "loss": 0.4473, "step": 3491 }, { "epoch": 0.65, "learning_rate": 1.8252032658688878e-05, "loss": 0.4823, "step": 3492 }, { "epoch": 0.65, "learning_rate": 1.8250904261467005e-05, "loss": 0.4678, "step": 3493 }, { "epoch": 0.65, "learning_rate": 1.8249775535049328e-05, "loss": 0.4814, "step": 3494 }, { "epoch": 0.65, "learning_rate": 1.824864647948088e-05, "loss": 0.4545, "step": 3495 }, { "epoch": 0.65, "learning_rate": 1.824751709480671e-05, "loss": 0.4619, "step": 3496 }, { "epoch": 0.65, "learning_rate": 1.8246387381071883e-05, "loss": 0.474, "step": 3497 }, { "epoch": 0.65, "learning_rate": 1.824525733832146e-05, "loss": 0.449, "step": 3498 }, { "epoch": 0.65, "learning_rate": 1.824412696660054e-05, "loss": 0.4588, "step": 3499 }, { "epoch": 0.65, "learning_rate": 1.8242996265954214e-05, "loss": 0.4673, "step": 3500 }, { "epoch": 0.65, "learning_rate": 1.82418652364276e-05, "loss": 0.4416, "step": 3501 }, { "epoch": 0.65, "learning_rate": 1.8240733878065825e-05, "loss": 0.477, "step": 3502 }, { "epoch": 0.65, "learning_rate": 1.823960219091402e-05, "loss": 0.4815, "step": 3503 }, { "epoch": 0.65, "learning_rate": 1.823847017501735e-05, "loss": 0.4941, "step": 3504 }, { "epoch": 0.65, "learning_rate": 1.8237337830420968e-05, "loss": 0.4748, "step": 3505 }, { "epoch": 0.65, "learning_rate": 1.8236205157170057e-05, "loss": 0.4654, "step": 3506 }, { "epoch": 0.65, "learning_rate": 1.823507215530981e-05, "loss": 0.47, "step": 3507 }, { "epoch": 0.65, "learning_rate": 1.8233938824885433e-05, "loss": 0.4443, "step": 3508 }, { "epoch": 0.65, "learning_rate": 1.8232805165942143e-05, "loss": 0.4573, "step": 3509 }, { "epoch": 0.65, "learning_rate": 1.8231671178525164e-05, "loss": 0.4632, "step": 3510 }, { "epoch": 0.65, "learning_rate": 1.823053686267975e-05, "loss": 0.4783, "step": 3511 }, { "epoch": 0.65, "learning_rate": 1.822940221845115e-05, "loss": 0.4646, "step": 3512 }, { "epoch": 0.65, "learning_rate": 1.822826724588464e-05, "loss": 0.4508, "step": 3513 }, { "epoch": 0.65, "learning_rate": 1.82271319450255e-05, "loss": 0.4663, "step": 3514 }, { "epoch": 0.65, "learning_rate": 1.822599631591903e-05, "loss": 0.4765, "step": 3515 }, { "epoch": 0.65, "learning_rate": 1.8224860358610534e-05, "loss": 0.4611, "step": 3516 }, { "epoch": 0.65, "learning_rate": 1.8223724073145342e-05, "loss": 0.4757, "step": 3517 }, { "epoch": 0.65, "learning_rate": 1.8222587459568783e-05, "loss": 0.4541, "step": 3518 }, { "epoch": 0.65, "learning_rate": 1.8221450517926205e-05, "loss": 0.4694, "step": 3519 }, { "epoch": 0.65, "learning_rate": 1.8220313248262976e-05, "loss": 0.4886, "step": 3520 }, { "epoch": 0.65, "learning_rate": 1.8219175650624467e-05, "loss": 0.4624, "step": 3521 }, { "epoch": 0.65, "learning_rate": 1.8218037725056068e-05, "loss": 0.499, "step": 3522 }, { "epoch": 0.65, "learning_rate": 1.8216899471603177e-05, "loss": 0.4802, "step": 3523 }, { "epoch": 0.65, "learning_rate": 1.821576089031121e-05, "loss": 0.458, "step": 3524 }, { "epoch": 0.65, "learning_rate": 1.8214621981225596e-05, "loss": 0.4653, "step": 3525 }, { "epoch": 0.65, "learning_rate": 1.8213482744391777e-05, "loss": 0.465, "step": 3526 }, { "epoch": 0.65, "learning_rate": 1.82123431798552e-05, "loss": 0.459, "step": 3527 }, { "epoch": 0.65, "learning_rate": 1.8211203287661338e-05, "loss": 0.4826, "step": 3528 }, { "epoch": 0.65, "learning_rate": 1.821006306785566e-05, "loss": 0.4871, "step": 3529 }, { "epoch": 0.65, "learning_rate": 1.8208922520483675e-05, "loss": 0.4756, "step": 3530 }, { "epoch": 0.65, "learning_rate": 1.8207781645590874e-05, "loss": 0.459, "step": 3531 }, { "epoch": 0.65, "learning_rate": 1.8206640443222782e-05, "loss": 0.4618, "step": 3532 }, { "epoch": 0.65, "learning_rate": 1.8205498913424933e-05, "loss": 0.4905, "step": 3533 }, { "epoch": 0.65, "learning_rate": 1.820435705624287e-05, "loss": 0.4628, "step": 3534 }, { "epoch": 0.65, "learning_rate": 1.8203214871722145e-05, "loss": 0.4481, "step": 3535 }, { "epoch": 0.65, "learning_rate": 1.820207235990834e-05, "loss": 0.471, "step": 3536 }, { "epoch": 0.65, "learning_rate": 1.820092952084703e-05, "loss": 0.4475, "step": 3537 }, { "epoch": 0.65, "learning_rate": 1.819978635458382e-05, "loss": 0.4757, "step": 3538 }, { "epoch": 0.65, "learning_rate": 1.8198642861164313e-05, "loss": 0.4866, "step": 3539 }, { "epoch": 0.65, "learning_rate": 1.8197499040634136e-05, "loss": 0.4759, "step": 3540 }, { "epoch": 0.66, "learning_rate": 1.8196354893038923e-05, "loss": 0.4556, "step": 3541 }, { "epoch": 0.66, "learning_rate": 1.8195210418424327e-05, "loss": 0.4753, "step": 3542 }, { "epoch": 0.66, "learning_rate": 1.8194065616836006e-05, "loss": 0.4577, "step": 3543 }, { "epoch": 0.66, "learning_rate": 1.8192920488319642e-05, "loss": 0.4526, "step": 3544 }, { "epoch": 0.66, "learning_rate": 1.8191775032920914e-05, "loss": 0.4678, "step": 3545 }, { "epoch": 0.66, "learning_rate": 1.819062925068553e-05, "loss": 0.4743, "step": 3546 }, { "epoch": 0.66, "learning_rate": 1.818948314165921e-05, "loss": 0.4818, "step": 3547 }, { "epoch": 0.66, "learning_rate": 1.8188336705887665e-05, "loss": 0.4764, "step": 3548 }, { "epoch": 0.66, "learning_rate": 1.818718994341665e-05, "loss": 0.4664, "step": 3549 }, { "epoch": 0.66, "learning_rate": 1.8186042854291918e-05, "loss": 0.4742, "step": 3550 }, { "epoch": 0.66, "learning_rate": 1.818489543855923e-05, "loss": 0.4678, "step": 3551 }, { "epoch": 0.66, "learning_rate": 1.8183747696264368e-05, "loss": 0.4611, "step": 3552 }, { "epoch": 0.66, "learning_rate": 1.8182599627453125e-05, "loss": 0.4553, "step": 3553 }, { "epoch": 0.66, "learning_rate": 1.8181451232171302e-05, "loss": 0.4472, "step": 3554 }, { "epoch": 0.66, "learning_rate": 1.8180302510464726e-05, "loss": 0.4433, "step": 3555 }, { "epoch": 0.66, "learning_rate": 1.8179153462379228e-05, "loss": 0.4758, "step": 3556 }, { "epoch": 0.66, "learning_rate": 1.8178004087960643e-05, "loss": 0.4772, "step": 3557 }, { "epoch": 0.66, "learning_rate": 1.817685438725484e-05, "loss": 0.471, "step": 3558 }, { "epoch": 0.66, "learning_rate": 1.8175704360307687e-05, "loss": 0.452, "step": 3559 }, { "epoch": 0.66, "learning_rate": 1.8174554007165067e-05, "loss": 0.4616, "step": 3560 }, { "epoch": 0.66, "learning_rate": 1.8173403327872877e-05, "loss": 0.481, "step": 3561 }, { "epoch": 0.66, "learning_rate": 1.8172252322477028e-05, "loss": 0.4679, "step": 3562 }, { "epoch": 0.66, "learning_rate": 1.817110099102344e-05, "loss": 0.4721, "step": 3563 }, { "epoch": 0.66, "learning_rate": 1.816994933355805e-05, "loss": 0.4825, "step": 3564 }, { "epoch": 0.66, "learning_rate": 1.8168797350126808e-05, "loss": 0.4683, "step": 3565 }, { "epoch": 0.66, "learning_rate": 1.8167645040775673e-05, "loss": 0.47, "step": 3566 }, { "epoch": 0.66, "learning_rate": 1.816649240555063e-05, "loss": 0.4895, "step": 3567 }, { "epoch": 0.66, "learning_rate": 1.8165339444497653e-05, "loss": 0.4867, "step": 3568 }, { "epoch": 0.66, "learning_rate": 1.8164186157662755e-05, "loss": 0.4846, "step": 3569 }, { "epoch": 0.66, "learning_rate": 1.8163032545091942e-05, "loss": 0.4694, "step": 3570 }, { "epoch": 0.66, "learning_rate": 1.8161878606831245e-05, "loss": 0.4673, "step": 3571 }, { "epoch": 0.66, "learning_rate": 1.8160724342926706e-05, "loss": 0.4642, "step": 3572 }, { "epoch": 0.66, "learning_rate": 1.815956975342437e-05, "loss": 0.4727, "step": 3573 }, { "epoch": 0.66, "learning_rate": 1.8158414838370308e-05, "loss": 0.4535, "step": 3574 }, { "epoch": 0.66, "learning_rate": 1.81572595978106e-05, "loss": 0.4698, "step": 3575 }, { "epoch": 0.66, "learning_rate": 1.8156104031791337e-05, "loss": 0.4582, "step": 3576 }, { "epoch": 0.66, "learning_rate": 1.8154948140358627e-05, "loss": 0.4575, "step": 3577 }, { "epoch": 0.66, "learning_rate": 1.815379192355858e-05, "loss": 0.4598, "step": 3578 }, { "epoch": 0.66, "learning_rate": 1.8152635381437332e-05, "loss": 0.4592, "step": 3579 }, { "epoch": 0.66, "learning_rate": 1.815147851404103e-05, "loss": 0.4828, "step": 3580 }, { "epoch": 0.66, "learning_rate": 1.8150321321415822e-05, "loss": 0.4758, "step": 3581 }, { "epoch": 0.66, "learning_rate": 1.8149163803607887e-05, "loss": 0.4634, "step": 3582 }, { "epoch": 0.66, "learning_rate": 1.8148005960663403e-05, "loss": 0.4659, "step": 3583 }, { "epoch": 0.66, "learning_rate": 1.814684779262857e-05, "loss": 0.4825, "step": 3584 }, { "epoch": 0.66, "learning_rate": 1.8145689299549588e-05, "loss": 0.471, "step": 3585 }, { "epoch": 0.66, "learning_rate": 1.8144530481472688e-05, "loss": 0.4659, "step": 3586 }, { "epoch": 0.66, "learning_rate": 1.81433713384441e-05, "loss": 0.4478, "step": 3587 }, { "epoch": 0.66, "learning_rate": 1.8142211870510072e-05, "loss": 0.4592, "step": 3588 }, { "epoch": 0.66, "learning_rate": 1.814105207771687e-05, "loss": 0.4832, "step": 3589 }, { "epoch": 0.66, "learning_rate": 1.8139891960110752e-05, "loss": 0.4695, "step": 3590 }, { "epoch": 0.66, "learning_rate": 1.8138731517738028e-05, "loss": 0.4678, "step": 3591 }, { "epoch": 0.66, "learning_rate": 1.8137570750644977e-05, "loss": 0.4662, "step": 3592 }, { "epoch": 0.66, "learning_rate": 1.813640965887792e-05, "loss": 0.4863, "step": 3593 }, { "epoch": 0.66, "learning_rate": 1.8135248242483185e-05, "loss": 0.479, "step": 3594 }, { "epoch": 0.67, "learning_rate": 1.81340865015071e-05, "loss": 0.4515, "step": 3595 }, { "epoch": 0.67, "learning_rate": 1.813292443599603e-05, "loss": 0.4769, "step": 3596 }, { "epoch": 0.67, "learning_rate": 1.8131762045996333e-05, "loss": 0.4551, "step": 3597 }, { "epoch": 0.67, "learning_rate": 1.8130599331554384e-05, "loss": 0.4682, "step": 3598 }, { "epoch": 0.67, "learning_rate": 1.8129436292716577e-05, "loss": 0.4532, "step": 3599 }, { "epoch": 0.67, "learning_rate": 1.8128272929529312e-05, "loss": 0.4515, "step": 3600 }, { "epoch": 0.67, "learning_rate": 1.8127109242039003e-05, "loss": 0.4751, "step": 3601 }, { "epoch": 0.67, "learning_rate": 1.812594523029209e-05, "loss": 0.4613, "step": 3602 }, { "epoch": 0.67, "learning_rate": 1.8124780894335e-05, "loss": 0.4721, "step": 3603 }, { "epoch": 0.67, "learning_rate": 1.8123616234214196e-05, "loss": 0.4732, "step": 3604 }, { "epoch": 0.67, "learning_rate": 1.8122451249976144e-05, "loss": 0.4797, "step": 3605 }, { "epoch": 0.67, "learning_rate": 1.812128594166733e-05, "loss": 0.4874, "step": 3606 }, { "epoch": 0.67, "learning_rate": 1.8120120309334238e-05, "loss": 0.4646, "step": 3607 }, { "epoch": 0.67, "learning_rate": 1.8118954353023384e-05, "loss": 0.4629, "step": 3608 }, { "epoch": 0.67, "learning_rate": 1.811778807278128e-05, "loss": 0.4557, "step": 3609 }, { "epoch": 0.67, "learning_rate": 1.8116621468654462e-05, "loss": 0.4731, "step": 3610 }, { "epoch": 0.67, "learning_rate": 1.8115454540689476e-05, "loss": 0.4678, "step": 3611 }, { "epoch": 0.67, "learning_rate": 1.811428728893288e-05, "loss": 0.4695, "step": 3612 }, { "epoch": 0.67, "learning_rate": 1.8113119713431243e-05, "loss": 0.4783, "step": 3613 }, { "epoch": 0.67, "learning_rate": 1.811195181423115e-05, "loss": 0.4448, "step": 3614 }, { "epoch": 0.67, "learning_rate": 1.81107835913792e-05, "loss": 0.4518, "step": 3615 }, { "epoch": 0.67, "learning_rate": 1.8109615044922e-05, "loss": 0.4863, "step": 3616 }, { "epoch": 0.67, "learning_rate": 1.8108446174906175e-05, "loss": 0.4716, "step": 3617 }, { "epoch": 0.67, "learning_rate": 1.8107276981378363e-05, "loss": 0.4863, "step": 3618 }, { "epoch": 0.67, "learning_rate": 1.8106107464385202e-05, "loss": 0.4575, "step": 3619 }, { "epoch": 0.67, "learning_rate": 1.8104937623973368e-05, "loss": 0.5035, "step": 3620 }, { "epoch": 0.67, "learning_rate": 1.8103767460189525e-05, "loss": 0.4618, "step": 3621 }, { "epoch": 0.67, "learning_rate": 1.8102596973080365e-05, "loss": 0.4612, "step": 3622 }, { "epoch": 0.67, "learning_rate": 1.8101426162692587e-05, "loss": 0.4673, "step": 3623 }, { "epoch": 0.67, "learning_rate": 1.8100255029072905e-05, "loss": 0.4747, "step": 3624 }, { "epoch": 0.67, "learning_rate": 1.8099083572268047e-05, "loss": 0.4672, "step": 3625 }, { "epoch": 0.67, "learning_rate": 1.8097911792324748e-05, "loss": 0.4697, "step": 3626 }, { "epoch": 0.67, "learning_rate": 1.809673968928976e-05, "loss": 0.4763, "step": 3627 }, { "epoch": 0.67, "learning_rate": 1.809556726320985e-05, "loss": 0.4823, "step": 3628 }, { "epoch": 0.67, "learning_rate": 1.8094394514131795e-05, "loss": 0.4837, "step": 3629 }, { "epoch": 0.67, "learning_rate": 1.8093221442102385e-05, "loss": 0.4684, "step": 3630 }, { "epoch": 0.67, "learning_rate": 1.8092048047168426e-05, "loss": 0.4594, "step": 3631 }, { "epoch": 0.67, "learning_rate": 1.8090874329376726e-05, "loss": 0.4709, "step": 3632 }, { "epoch": 0.67, "learning_rate": 1.8089700288774122e-05, "loss": 0.4866, "step": 3633 }, { "epoch": 0.67, "learning_rate": 1.808852592540746e-05, "loss": 0.4579, "step": 3634 }, { "epoch": 0.67, "learning_rate": 1.8087351239323584e-05, "loss": 0.4523, "step": 3635 }, { "epoch": 0.67, "learning_rate": 1.808617623056937e-05, "loss": 0.4534, "step": 3636 }, { "epoch": 0.67, "learning_rate": 1.8085000899191688e-05, "loss": 0.469, "step": 3637 }, { "epoch": 0.67, "learning_rate": 1.8083825245237444e-05, "loss": 0.4615, "step": 3638 }, { "epoch": 0.67, "learning_rate": 1.808264926875354e-05, "loss": 0.471, "step": 3639 }, { "epoch": 0.67, "learning_rate": 1.8081472969786896e-05, "loss": 0.4828, "step": 3640 }, { "epoch": 0.67, "learning_rate": 1.8080296348384444e-05, "loss": 0.4752, "step": 3641 }, { "epoch": 0.67, "learning_rate": 1.8079119404593124e-05, "loss": 0.4408, "step": 3642 }, { "epoch": 0.67, "learning_rate": 1.80779421384599e-05, "loss": 0.4845, "step": 3643 }, { "epoch": 0.67, "learning_rate": 1.8076764550031738e-05, "loss": 0.4622, "step": 3644 }, { "epoch": 0.67, "learning_rate": 1.8075586639355626e-05, "loss": 0.4654, "step": 3645 }, { "epoch": 0.67, "learning_rate": 1.807440840647856e-05, "loss": 0.4935, "step": 3646 }, { "epoch": 0.67, "learning_rate": 1.807322985144755e-05, "loss": 0.4749, "step": 3647 }, { "epoch": 0.67, "learning_rate": 1.8072050974309608e-05, "loss": 0.465, "step": 3648 }, { "epoch": 0.68, "learning_rate": 1.8070871775111784e-05, "loss": 0.4497, "step": 3649 }, { "epoch": 0.68, "learning_rate": 1.8069692253901117e-05, "loss": 0.4675, "step": 3650 }, { "epoch": 0.68, "learning_rate": 1.806851241072467e-05, "loss": 0.4691, "step": 3651 }, { "epoch": 0.68, "learning_rate": 1.8067332245629516e-05, "loss": 0.4674, "step": 3652 }, { "epoch": 0.68, "learning_rate": 1.806615175866274e-05, "loss": 0.4895, "step": 3653 }, { "epoch": 0.68, "learning_rate": 1.8064970949871446e-05, "loss": 0.4688, "step": 3654 }, { "epoch": 0.68, "learning_rate": 1.8063789819302743e-05, "loss": 0.4554, "step": 3655 }, { "epoch": 0.68, "learning_rate": 1.8062608367003754e-05, "loss": 0.4761, "step": 3656 }, { "epoch": 0.68, "learning_rate": 1.8061426593021618e-05, "loss": 0.4765, "step": 3657 }, { "epoch": 0.68, "learning_rate": 1.806024449740349e-05, "loss": 0.469, "step": 3658 }, { "epoch": 0.68, "learning_rate": 1.8059062080196524e-05, "loss": 0.481, "step": 3659 }, { "epoch": 0.68, "learning_rate": 1.8057879341447907e-05, "loss": 0.475, "step": 3660 }, { "epoch": 0.68, "learning_rate": 1.805669628120482e-05, "loss": 0.4554, "step": 3661 }, { "epoch": 0.68, "learning_rate": 1.8055512899514468e-05, "loss": 0.4592, "step": 3662 }, { "epoch": 0.68, "learning_rate": 1.805432919642407e-05, "loss": 0.4447, "step": 3663 }, { "epoch": 0.68, "learning_rate": 1.8053145171980846e-05, "loss": 0.4854, "step": 3664 }, { "epoch": 0.68, "learning_rate": 1.8051960826232037e-05, "loss": 0.4798, "step": 3665 }, { "epoch": 0.68, "learning_rate": 1.8050776159224902e-05, "loss": 0.4796, "step": 3666 }, { "epoch": 0.68, "learning_rate": 1.8049591171006705e-05, "loss": 0.4709, "step": 3667 }, { "epoch": 0.68, "learning_rate": 1.804840586162472e-05, "loss": 0.4624, "step": 3668 }, { "epoch": 0.68, "learning_rate": 1.8047220231126245e-05, "loss": 0.4909, "step": 3669 }, { "epoch": 0.68, "learning_rate": 1.8046034279558582e-05, "loss": 0.4699, "step": 3670 }, { "epoch": 0.68, "learning_rate": 1.804484800696905e-05, "loss": 0.4486, "step": 3671 }, { "epoch": 0.68, "learning_rate": 1.8043661413404972e-05, "loss": 0.4601, "step": 3672 }, { "epoch": 0.68, "learning_rate": 1.80424744989137e-05, "loss": 0.4719, "step": 3673 }, { "epoch": 0.68, "learning_rate": 1.8041287263542583e-05, "loss": 0.454, "step": 3674 }, { "epoch": 0.68, "learning_rate": 1.8040099707338994e-05, "loss": 0.4636, "step": 3675 }, { "epoch": 0.68, "learning_rate": 1.8038911830350313e-05, "loss": 0.4596, "step": 3676 }, { "epoch": 0.68, "learning_rate": 1.8037723632623932e-05, "loss": 0.4576, "step": 3677 }, { "epoch": 0.68, "learning_rate": 1.803653511420726e-05, "loss": 0.4618, "step": 3678 }, { "epoch": 0.68, "learning_rate": 1.8035346275147715e-05, "loss": 0.4696, "step": 3679 }, { "epoch": 0.68, "learning_rate": 1.8034157115492732e-05, "loss": 0.4778, "step": 3680 }, { "epoch": 0.68, "learning_rate": 1.803296763528976e-05, "loss": 0.4483, "step": 3681 }, { "epoch": 0.68, "learning_rate": 1.803177783458624e-05, "loss": 0.473, "step": 3682 }, { "epoch": 0.68, "learning_rate": 1.8030587713429666e-05, "loss": 0.5031, "step": 3683 }, { "epoch": 0.68, "learning_rate": 1.8029397271867502e-05, "loss": 0.4678, "step": 3684 }, { "epoch": 0.68, "learning_rate": 1.802820650994726e-05, "loss": 0.4824, "step": 3685 }, { "epoch": 0.68, "learning_rate": 1.8027015427716442e-05, "loss": 0.4761, "step": 3686 }, { "epoch": 0.68, "learning_rate": 1.8025824025222566e-05, "loss": 0.461, "step": 3687 }, { "epoch": 0.68, "learning_rate": 1.8024632302513173e-05, "loss": 0.4685, "step": 3688 }, { "epoch": 0.68, "learning_rate": 1.8023440259635806e-05, "loss": 0.4628, "step": 3689 }, { "epoch": 0.68, "learning_rate": 1.8022247896638026e-05, "loss": 0.4637, "step": 3690 }, { "epoch": 0.68, "learning_rate": 1.8021055213567414e-05, "loss": 0.4417, "step": 3691 }, { "epoch": 0.68, "learning_rate": 1.8019862210471546e-05, "loss": 0.4722, "step": 3692 }, { "epoch": 0.68, "learning_rate": 1.8018668887398024e-05, "loss": 0.4557, "step": 3693 }, { "epoch": 0.68, "learning_rate": 1.801747524439446e-05, "loss": 0.4565, "step": 3694 }, { "epoch": 0.68, "learning_rate": 1.801628128150848e-05, "loss": 0.4761, "step": 3695 }, { "epoch": 0.68, "learning_rate": 1.8015086998787717e-05, "loss": 0.4618, "step": 3696 }, { "epoch": 0.68, "learning_rate": 1.801389239627982e-05, "loss": 0.4724, "step": 3697 }, { "epoch": 0.68, "learning_rate": 1.8012697474032454e-05, "loss": 0.4482, "step": 3698 }, { "epoch": 0.68, "learning_rate": 1.8011502232093296e-05, "loss": 0.4567, "step": 3699 }, { "epoch": 0.68, "learning_rate": 1.801030667051003e-05, "loss": 0.4745, "step": 3700 }, { "epoch": 0.68, "learning_rate": 1.8009110789330363e-05, "loss": 0.4425, "step": 3701 }, { "epoch": 0.68, "learning_rate": 1.8007914588602e-05, "loss": 0.4522, "step": 3702 }, { "epoch": 0.69, "learning_rate": 1.8006718068372673e-05, "loss": 0.4416, "step": 3703 }, { "epoch": 0.69, "learning_rate": 1.8005521228690117e-05, "loss": 0.4646, "step": 3704 }, { "epoch": 0.69, "learning_rate": 1.8004324069602085e-05, "loss": 0.4573, "step": 3705 }, { "epoch": 0.69, "learning_rate": 1.8003126591156347e-05, "loss": 0.4703, "step": 3706 }, { "epoch": 0.69, "learning_rate": 1.8001928793400672e-05, "loss": 0.472, "step": 3707 }, { "epoch": 0.69, "learning_rate": 1.8000730676382853e-05, "loss": 0.4662, "step": 3708 }, { "epoch": 0.69, "learning_rate": 1.7999532240150693e-05, "loss": 0.4778, "step": 3709 }, { "epoch": 0.69, "learning_rate": 1.799833348475201e-05, "loss": 0.4687, "step": 3710 }, { "epoch": 0.69, "learning_rate": 1.7997134410234625e-05, "loss": 0.4707, "step": 3711 }, { "epoch": 0.69, "learning_rate": 1.7995935016646387e-05, "loss": 0.4798, "step": 3712 }, { "epoch": 0.69, "learning_rate": 1.7994735304035146e-05, "loss": 0.4528, "step": 3713 }, { "epoch": 0.69, "learning_rate": 1.7993535272448766e-05, "loss": 0.4665, "step": 3714 }, { "epoch": 0.69, "learning_rate": 1.799233492193513e-05, "loss": 0.4526, "step": 3715 }, { "epoch": 0.69, "learning_rate": 1.7991134252542125e-05, "loss": 0.4585, "step": 3716 }, { "epoch": 0.69, "learning_rate": 1.7989933264317663e-05, "loss": 0.4537, "step": 3717 }, { "epoch": 0.69, "learning_rate": 1.798873195730965e-05, "loss": 0.4602, "step": 3718 }, { "epoch": 0.69, "learning_rate": 1.7987530331566028e-05, "loss": 0.4606, "step": 3719 }, { "epoch": 0.69, "learning_rate": 1.7986328387134736e-05, "loss": 0.4782, "step": 3720 }, { "epoch": 0.69, "learning_rate": 1.7985126124063726e-05, "loss": 0.4501, "step": 3721 }, { "epoch": 0.69, "learning_rate": 1.798392354240097e-05, "loss": 0.4663, "step": 3722 }, { "epoch": 0.69, "learning_rate": 1.798272064219444e-05, "loss": 0.4586, "step": 3723 }, { "epoch": 0.69, "learning_rate": 1.798151742349214e-05, "loss": 0.4463, "step": 3724 }, { "epoch": 0.69, "learning_rate": 1.7980313886342073e-05, "loss": 0.4585, "step": 3725 }, { "epoch": 0.69, "learning_rate": 1.7979110030792256e-05, "loss": 0.4637, "step": 3726 }, { "epoch": 0.69, "learning_rate": 1.797790585689072e-05, "loss": 0.4841, "step": 3727 }, { "epoch": 0.69, "learning_rate": 1.7976701364685512e-05, "loss": 0.4572, "step": 3728 }, { "epoch": 0.69, "learning_rate": 1.797549655422469e-05, "loss": 0.441, "step": 3729 }, { "epoch": 0.69, "learning_rate": 1.797429142555632e-05, "loss": 0.469, "step": 3730 }, { "epoch": 0.69, "learning_rate": 1.7973085978728483e-05, "loss": 0.4482, "step": 3731 }, { "epoch": 0.69, "learning_rate": 1.797188021378928e-05, "loss": 0.4644, "step": 3732 }, { "epoch": 0.69, "learning_rate": 1.797067413078682e-05, "loss": 0.4631, "step": 3733 }, { "epoch": 0.69, "learning_rate": 1.7969467729769216e-05, "loss": 0.4574, "step": 3734 }, { "epoch": 0.69, "learning_rate": 1.7968261010784602e-05, "loss": 0.4668, "step": 3735 }, { "epoch": 0.69, "learning_rate": 1.796705397388113e-05, "loss": 0.4611, "step": 3736 }, { "epoch": 0.69, "learning_rate": 1.7965846619106955e-05, "loss": 0.4842, "step": 3737 }, { "epoch": 0.69, "learning_rate": 1.7964638946510246e-05, "loss": 0.4648, "step": 3738 }, { "epoch": 0.69, "learning_rate": 1.796343095613919e-05, "loss": 0.4685, "step": 3739 }, { "epoch": 0.69, "learning_rate": 1.7962222648041986e-05, "loss": 0.469, "step": 3740 }, { "epoch": 0.69, "learning_rate": 1.7961014022266837e-05, "loss": 0.4401, "step": 3741 }, { "epoch": 0.69, "learning_rate": 1.7959805078861967e-05, "loss": 0.4794, "step": 3742 }, { "epoch": 0.69, "learning_rate": 1.7958595817875614e-05, "loss": 0.4535, "step": 3743 }, { "epoch": 0.69, "learning_rate": 1.795738623935602e-05, "loss": 0.4869, "step": 3744 }, { "epoch": 0.69, "learning_rate": 1.795617634335145e-05, "loss": 0.4776, "step": 3745 }, { "epoch": 0.69, "learning_rate": 1.7954966129910175e-05, "loss": 0.4449, "step": 3746 }, { "epoch": 0.69, "learning_rate": 1.7953755599080475e-05, "loss": 0.5019, "step": 3747 }, { "epoch": 0.69, "learning_rate": 1.7952544750910657e-05, "loss": 0.4661, "step": 3748 }, { "epoch": 0.69, "learning_rate": 1.7951333585449026e-05, "loss": 0.4719, "step": 3749 }, { "epoch": 0.69, "learning_rate": 1.7950122102743907e-05, "loss": 0.4407, "step": 3750 }, { "epoch": 0.69, "learning_rate": 1.7948910302843638e-05, "loss": 0.4472, "step": 3751 }, { "epoch": 0.69, "learning_rate": 1.794769818579656e-05, "loss": 0.4539, "step": 3752 }, { "epoch": 0.69, "learning_rate": 1.794648575165104e-05, "loss": 0.4538, "step": 3753 }, { "epoch": 0.69, "learning_rate": 1.7945273000455455e-05, "loss": 0.4751, "step": 3754 }, { "epoch": 0.69, "learning_rate": 1.7944059932258185e-05, "loss": 0.4625, "step": 3755 }, { "epoch": 0.69, "learning_rate": 1.794284654710763e-05, "loss": 0.4672, "step": 3756 }, { "epoch": 0.7, "learning_rate": 1.7941632845052207e-05, "loss": 0.4969, "step": 3757 }, { "epoch": 0.7, "learning_rate": 1.7940418826140332e-05, "loss": 0.4676, "step": 3758 }, { "epoch": 0.7, "learning_rate": 1.793920449042045e-05, "loss": 0.4792, "step": 3759 }, { "epoch": 0.7, "learning_rate": 1.7937989837941007e-05, "loss": 0.5048, "step": 3760 }, { "epoch": 0.7, "learning_rate": 1.793677486875047e-05, "loss": 0.4606, "step": 3761 }, { "epoch": 0.7, "learning_rate": 1.793555958289731e-05, "loss": 0.4748, "step": 3762 }, { "epoch": 0.7, "learning_rate": 1.7934343980430008e-05, "loss": 0.4382, "step": 3763 }, { "epoch": 0.7, "learning_rate": 1.7933128061397078e-05, "loss": 0.464, "step": 3764 }, { "epoch": 0.7, "learning_rate": 1.7931911825847024e-05, "loss": 0.4563, "step": 3765 }, { "epoch": 0.7, "learning_rate": 1.7930695273828375e-05, "loss": 0.4615, "step": 3766 }, { "epoch": 0.7, "learning_rate": 1.7929478405389665e-05, "loss": 0.4545, "step": 3767 }, { "epoch": 0.7, "learning_rate": 1.792826122057945e-05, "loss": 0.4638, "step": 3768 }, { "epoch": 0.7, "learning_rate": 1.792704371944629e-05, "loss": 0.4592, "step": 3769 }, { "epoch": 0.7, "learning_rate": 1.792582590203876e-05, "loss": 0.4676, "step": 3770 }, { "epoch": 0.7, "learning_rate": 1.7924607768405454e-05, "loss": 0.4728, "step": 3771 }, { "epoch": 0.7, "learning_rate": 1.792338931859497e-05, "loss": 0.4672, "step": 3772 }, { "epoch": 0.7, "learning_rate": 1.792217055265592e-05, "loss": 0.4709, "step": 3773 }, { "epoch": 0.7, "learning_rate": 1.7920951470636933e-05, "loss": 0.4598, "step": 3774 }, { "epoch": 0.7, "learning_rate": 1.791973207258665e-05, "loss": 0.4804, "step": 3775 }, { "epoch": 0.7, "learning_rate": 1.7918512358553716e-05, "loss": 0.4768, "step": 3776 }, { "epoch": 0.7, "learning_rate": 1.7917292328586805e-05, "loss": 0.4647, "step": 3777 }, { "epoch": 0.7, "learning_rate": 1.7916071982734585e-05, "loss": 0.4678, "step": 3778 }, { "epoch": 0.7, "learning_rate": 1.791485132104575e-05, "loss": 0.4575, "step": 3779 }, { "epoch": 0.7, "learning_rate": 1.7913630343569e-05, "loss": 0.47, "step": 3780 }, { "epoch": 0.7, "learning_rate": 1.7912409050353052e-05, "loss": 0.4622, "step": 3781 }, { "epoch": 0.7, "learning_rate": 1.7911187441446633e-05, "loss": 0.4692, "step": 3782 }, { "epoch": 0.7, "learning_rate": 1.790996551689848e-05, "loss": 0.4613, "step": 3783 }, { "epoch": 0.7, "learning_rate": 1.790874327675735e-05, "loss": 0.4608, "step": 3784 }, { "epoch": 0.7, "learning_rate": 1.7907520721072008e-05, "loss": 0.4652, "step": 3785 }, { "epoch": 0.7, "learning_rate": 1.7906297849891223e-05, "loss": 0.4671, "step": 3786 }, { "epoch": 0.7, "learning_rate": 1.7905074663263797e-05, "loss": 0.4481, "step": 3787 }, { "epoch": 0.7, "learning_rate": 1.7903851161238524e-05, "loss": 0.4529, "step": 3788 }, { "epoch": 0.7, "learning_rate": 1.790262734386423e-05, "loss": 0.4706, "step": 3789 }, { "epoch": 0.7, "learning_rate": 1.7901403211189728e-05, "loss": 0.458, "step": 3790 }, { "epoch": 0.7, "learning_rate": 1.7900178763263874e-05, "loss": 0.48, "step": 3791 }, { "epoch": 0.7, "learning_rate": 1.7898954000135512e-05, "loss": 0.4644, "step": 3792 }, { "epoch": 0.7, "learning_rate": 1.789772892185351e-05, "loss": 0.4462, "step": 3793 }, { "epoch": 0.7, "learning_rate": 1.789650352846674e-05, "loss": 0.4718, "step": 3794 }, { "epoch": 0.7, "learning_rate": 1.7895277820024107e-05, "loss": 0.4553, "step": 3795 }, { "epoch": 0.7, "learning_rate": 1.7894051796574505e-05, "loss": 0.4835, "step": 3796 }, { "epoch": 0.7, "learning_rate": 1.789282545816685e-05, "loss": 0.4544, "step": 3797 }, { "epoch": 0.7, "learning_rate": 1.7891598804850074e-05, "loss": 0.4522, "step": 3798 }, { "epoch": 0.7, "learning_rate": 1.7890371836673116e-05, "loss": 0.4597, "step": 3799 }, { "epoch": 0.7, "learning_rate": 1.788914455368493e-05, "loss": 0.4612, "step": 3800 }, { "epoch": 0.7, "learning_rate": 1.7887916955934485e-05, "loss": 0.5003, "step": 3801 }, { "epoch": 0.7, "learning_rate": 1.7886689043470757e-05, "loss": 0.4647, "step": 3802 }, { "epoch": 0.7, "learning_rate": 1.7885460816342735e-05, "loss": 0.4486, "step": 3803 }, { "epoch": 0.7, "learning_rate": 1.788423227459943e-05, "loss": 0.4569, "step": 3804 }, { "epoch": 0.7, "learning_rate": 1.788300341828985e-05, "loss": 0.4721, "step": 3805 }, { "epoch": 0.7, "learning_rate": 1.788177424746303e-05, "loss": 0.4485, "step": 3806 }, { "epoch": 0.7, "learning_rate": 1.788054476216801e-05, "loss": 0.4836, "step": 3807 }, { "epoch": 0.7, "learning_rate": 1.7879314962453846e-05, "loss": 0.481, "step": 3808 }, { "epoch": 0.7, "learning_rate": 1.7878084848369603e-05, "loss": 0.4683, "step": 3809 }, { "epoch": 0.7, "learning_rate": 1.787685441996436e-05, "loss": 0.4564, "step": 3810 }, { "epoch": 0.71, "learning_rate": 1.7875623677287208e-05, "loss": 0.4339, "step": 3811 }, { "epoch": 0.71, "learning_rate": 1.7874392620387257e-05, "loss": 0.4554, "step": 3812 }, { "epoch": 0.71, "learning_rate": 1.7873161249313615e-05, "loss": 0.4443, "step": 3813 }, { "epoch": 0.71, "learning_rate": 1.787192956411542e-05, "loss": 0.4643, "step": 3814 }, { "epoch": 0.71, "learning_rate": 1.7870697564841803e-05, "loss": 0.4323, "step": 3815 }, { "epoch": 0.71, "learning_rate": 1.786946525154193e-05, "loss": 0.4516, "step": 3816 }, { "epoch": 0.71, "learning_rate": 1.7868232624264963e-05, "loss": 0.4679, "step": 3817 }, { "epoch": 0.71, "learning_rate": 1.7866999683060082e-05, "loss": 0.4779, "step": 3818 }, { "epoch": 0.71, "learning_rate": 1.786576642797648e-05, "loss": 0.4661, "step": 3819 }, { "epoch": 0.71, "learning_rate": 1.786453285906336e-05, "loss": 0.4744, "step": 3820 }, { "epoch": 0.71, "learning_rate": 1.7863298976369935e-05, "loss": 0.4497, "step": 3821 }, { "epoch": 0.71, "learning_rate": 1.7862064779945445e-05, "loss": 0.4599, "step": 3822 }, { "epoch": 0.71, "learning_rate": 1.7860830269839126e-05, "loss": 0.4584, "step": 3823 }, { "epoch": 0.71, "learning_rate": 1.785959544610023e-05, "loss": 0.4522, "step": 3824 }, { "epoch": 0.71, "learning_rate": 1.7858360308778033e-05, "loss": 0.4517, "step": 3825 }, { "epoch": 0.71, "learning_rate": 1.7857124857921804e-05, "loss": 0.4708, "step": 3826 }, { "epoch": 0.71, "learning_rate": 1.7855889093580843e-05, "loss": 0.4509, "step": 3827 }, { "epoch": 0.71, "learning_rate": 1.785465301580445e-05, "loss": 0.4657, "step": 3828 }, { "epoch": 0.71, "learning_rate": 1.7853416624641944e-05, "loss": 0.4833, "step": 3829 }, { "epoch": 0.71, "learning_rate": 1.7852179920142656e-05, "loss": 0.4569, "step": 3830 }, { "epoch": 0.71, "learning_rate": 1.785094290235593e-05, "loss": 0.4454, "step": 3831 }, { "epoch": 0.71, "learning_rate": 1.7849705571331112e-05, "loss": 0.4684, "step": 3832 }, { "epoch": 0.71, "learning_rate": 1.7848467927117578e-05, "loss": 0.4655, "step": 3833 }, { "epoch": 0.71, "learning_rate": 1.7847229969764704e-05, "loss": 0.4778, "step": 3834 }, { "epoch": 0.71, "learning_rate": 1.7845991699321884e-05, "loss": 0.4767, "step": 3835 }, { "epoch": 0.71, "learning_rate": 1.7844753115838522e-05, "loss": 0.46, "step": 3836 }, { "epoch": 0.71, "learning_rate": 1.7843514219364035e-05, "loss": 0.4694, "step": 3837 }, { "epoch": 0.71, "learning_rate": 1.7842275009947848e-05, "loss": 0.4732, "step": 3838 }, { "epoch": 0.71, "learning_rate": 1.7841035487639412e-05, "loss": 0.4634, "step": 3839 }, { "epoch": 0.71, "learning_rate": 1.7839795652488176e-05, "loss": 0.4834, "step": 3840 }, { "epoch": 0.71, "learning_rate": 1.783855550454361e-05, "loss": 0.4707, "step": 3841 }, { "epoch": 0.71, "learning_rate": 1.7837315043855192e-05, "loss": 0.4889, "step": 3842 }, { "epoch": 0.71, "learning_rate": 1.7836074270472412e-05, "loss": 0.4741, "step": 3843 }, { "epoch": 0.71, "learning_rate": 1.783483318444478e-05, "loss": 0.4705, "step": 3844 }, { "epoch": 0.71, "learning_rate": 1.7833591785821807e-05, "loss": 0.449, "step": 3845 }, { "epoch": 0.71, "learning_rate": 1.7832350074653027e-05, "loss": 0.4645, "step": 3846 }, { "epoch": 0.71, "learning_rate": 1.7831108050987976e-05, "loss": 0.4624, "step": 3847 }, { "epoch": 0.71, "learning_rate": 1.782986571487622e-05, "loss": 0.4589, "step": 3848 }, { "epoch": 0.71, "learning_rate": 1.7828623066367312e-05, "loss": 0.4649, "step": 3849 }, { "epoch": 0.71, "learning_rate": 1.7827380105510842e-05, "loss": 0.4636, "step": 3850 }, { "epoch": 0.71, "learning_rate": 1.7826136832356394e-05, "loss": 0.4569, "step": 3851 }, { "epoch": 0.71, "learning_rate": 1.782489324695358e-05, "loss": 0.4733, "step": 3852 }, { "epoch": 0.71, "learning_rate": 1.782364934935201e-05, "loss": 0.4706, "step": 3853 }, { "epoch": 0.71, "learning_rate": 1.7822405139601317e-05, "loss": 0.4766, "step": 3854 }, { "epoch": 0.71, "learning_rate": 1.7821160617751142e-05, "loss": 0.4683, "step": 3855 }, { "epoch": 0.71, "learning_rate": 1.781991578385114e-05, "loss": 0.4792, "step": 3856 }, { "epoch": 0.71, "learning_rate": 1.7818670637950976e-05, "loss": 0.4662, "step": 3857 }, { "epoch": 0.71, "learning_rate": 1.7817425180100328e-05, "loss": 0.445, "step": 3858 }, { "epoch": 0.71, "learning_rate": 1.781617941034889e-05, "loss": 0.4742, "step": 3859 }, { "epoch": 0.71, "learning_rate": 1.7814933328746363e-05, "loss": 0.4598, "step": 3860 }, { "epoch": 0.71, "learning_rate": 1.7813686935342468e-05, "loss": 0.4552, "step": 3861 }, { "epoch": 0.71, "learning_rate": 1.7812440230186928e-05, "loss": 0.468, "step": 3862 }, { "epoch": 0.71, "learning_rate": 1.781119321332949e-05, "loss": 0.4405, "step": 3863 }, { "epoch": 0.71, "learning_rate": 1.7809945884819904e-05, "loss": 0.4655, "step": 3864 }, { "epoch": 0.72, "learning_rate": 1.7808698244707936e-05, "loss": 0.4889, "step": 3865 }, { "epoch": 0.72, "learning_rate": 1.7807450293043366e-05, "loss": 0.4823, "step": 3866 }, { "epoch": 0.72, "learning_rate": 1.780620202987598e-05, "loss": 0.4557, "step": 3867 }, { "epoch": 0.72, "learning_rate": 1.7804953455255592e-05, "loss": 0.4681, "step": 3868 }, { "epoch": 0.72, "learning_rate": 1.7803704569232014e-05, "loss": 0.4604, "step": 3869 }, { "epoch": 0.72, "learning_rate": 1.7802455371855065e-05, "loss": 0.4545, "step": 3870 }, { "epoch": 0.72, "learning_rate": 1.7801205863174595e-05, "loss": 0.4563, "step": 3871 }, { "epoch": 0.72, "learning_rate": 1.7799956043240455e-05, "loss": 0.4632, "step": 3872 }, { "epoch": 0.72, "learning_rate": 1.779870591210251e-05, "loss": 0.4752, "step": 3873 }, { "epoch": 0.72, "learning_rate": 1.779745546981064e-05, "loss": 0.4675, "step": 3874 }, { "epoch": 0.72, "learning_rate": 1.779620471641473e-05, "loss": 0.4874, "step": 3875 }, { "epoch": 0.72, "learning_rate": 1.7794953651964685e-05, "loss": 0.4729, "step": 3876 }, { "epoch": 0.72, "learning_rate": 1.7793702276510424e-05, "loss": 0.4696, "step": 3877 }, { "epoch": 0.72, "learning_rate": 1.779245059010187e-05, "loss": 0.4693, "step": 3878 }, { "epoch": 0.72, "learning_rate": 1.779119859278897e-05, "loss": 0.4585, "step": 3879 }, { "epoch": 0.72, "learning_rate": 1.7789946284621664e-05, "loss": 0.46, "step": 3880 }, { "epoch": 0.72, "learning_rate": 1.778869366564993e-05, "loss": 0.4638, "step": 3881 }, { "epoch": 0.72, "learning_rate": 1.7787440735923734e-05, "loss": 0.4538, "step": 3882 }, { "epoch": 0.72, "learning_rate": 1.7786187495493075e-05, "loss": 0.4499, "step": 3883 }, { "epoch": 0.72, "learning_rate": 1.7784933944407946e-05, "loss": 0.4597, "step": 3884 }, { "epoch": 0.72, "learning_rate": 1.778368008271837e-05, "loss": 0.4636, "step": 3885 }, { "epoch": 0.72, "learning_rate": 1.778242591047437e-05, "loss": 0.4544, "step": 3886 }, { "epoch": 0.72, "learning_rate": 1.7781171427725983e-05, "loss": 0.4517, "step": 3887 }, { "epoch": 0.72, "learning_rate": 1.7779916634523263e-05, "loss": 0.4691, "step": 3888 }, { "epoch": 0.72, "learning_rate": 1.7778661530916273e-05, "loss": 0.4684, "step": 3889 }, { "epoch": 0.72, "learning_rate": 1.777740611695509e-05, "loss": 0.4584, "step": 3890 }, { "epoch": 0.72, "learning_rate": 1.77761503926898e-05, "loss": 0.4463, "step": 3891 }, { "epoch": 0.72, "learning_rate": 1.7774894358170513e-05, "loss": 0.4439, "step": 3892 }, { "epoch": 0.72, "learning_rate": 1.7773638013447332e-05, "loss": 0.4482, "step": 3893 }, { "epoch": 0.72, "learning_rate": 1.7772381358570386e-05, "loss": 0.4372, "step": 3894 }, { "epoch": 0.72, "learning_rate": 1.7771124393589816e-05, "loss": 0.4661, "step": 3895 }, { "epoch": 0.72, "learning_rate": 1.7769867118555767e-05, "loss": 0.442, "step": 3896 }, { "epoch": 0.72, "learning_rate": 1.776860953351841e-05, "loss": 0.4764, "step": 3897 }, { "epoch": 0.72, "learning_rate": 1.776735163852791e-05, "loss": 0.4825, "step": 3898 }, { "epoch": 0.72, "learning_rate": 1.7766093433634465e-05, "loss": 0.4587, "step": 3899 }, { "epoch": 0.72, "learning_rate": 1.776483491888827e-05, "loss": 0.4566, "step": 3900 }, { "epoch": 0.72, "learning_rate": 1.776357609433954e-05, "loss": 0.4705, "step": 3901 }, { "epoch": 0.72, "learning_rate": 1.7762316960038494e-05, "loss": 0.4666, "step": 3902 }, { "epoch": 0.72, "learning_rate": 1.7761057516035373e-05, "loss": 0.469, "step": 3903 }, { "epoch": 0.72, "learning_rate": 1.7759797762380428e-05, "loss": 0.4747, "step": 3904 }, { "epoch": 0.72, "learning_rate": 1.775853769912392e-05, "loss": 0.485, "step": 3905 }, { "epoch": 0.72, "learning_rate": 1.775727732631612e-05, "loss": 0.4604, "step": 3906 }, { "epoch": 0.72, "learning_rate": 1.775601664400732e-05, "loss": 0.4433, "step": 3907 }, { "epoch": 0.72, "learning_rate": 1.775475565224781e-05, "loss": 0.4432, "step": 3908 }, { "epoch": 0.72, "learning_rate": 1.7753494351087912e-05, "loss": 0.4697, "step": 3909 }, { "epoch": 0.72, "learning_rate": 1.7752232740577945e-05, "loss": 0.4698, "step": 3910 }, { "epoch": 0.72, "learning_rate": 1.7750970820768242e-05, "loss": 0.4848, "step": 3911 }, { "epoch": 0.72, "learning_rate": 1.7749708591709155e-05, "loss": 0.4772, "step": 3912 }, { "epoch": 0.72, "learning_rate": 1.7748446053451042e-05, "loss": 0.4755, "step": 3913 }, { "epoch": 0.72, "learning_rate": 1.774718320604428e-05, "loss": 0.4487, "step": 3914 }, { "epoch": 0.72, "learning_rate": 1.7745920049539247e-05, "loss": 0.4554, "step": 3915 }, { "epoch": 0.72, "learning_rate": 1.774465658398635e-05, "loss": 0.4607, "step": 3916 }, { "epoch": 0.72, "learning_rate": 1.7743392809435992e-05, "loss": 0.4691, "step": 3917 }, { "epoch": 0.72, "learning_rate": 1.77421287259386e-05, "loss": 0.4747, "step": 3918 }, { "epoch": 0.73, "learning_rate": 1.77408643335446e-05, "loss": 0.472, "step": 3919 }, { "epoch": 0.73, "learning_rate": 1.773959963230445e-05, "loss": 0.4698, "step": 3920 }, { "epoch": 0.73, "learning_rate": 1.7738334622268603e-05, "loss": 0.4571, "step": 3921 }, { "epoch": 0.73, "learning_rate": 1.773706930348753e-05, "loss": 0.4544, "step": 3922 }, { "epoch": 0.73, "learning_rate": 1.773580367601172e-05, "loss": 0.4619, "step": 3923 }, { "epoch": 0.73, "learning_rate": 1.773453773989166e-05, "loss": 0.4553, "step": 3924 }, { "epoch": 0.73, "learning_rate": 1.773327149517787e-05, "loss": 0.4861, "step": 3925 }, { "epoch": 0.73, "learning_rate": 1.7732004941920864e-05, "loss": 0.4572, "step": 3926 }, { "epoch": 0.73, "learning_rate": 1.7730738080171174e-05, "loss": 0.4692, "step": 3927 }, { "epoch": 0.73, "learning_rate": 1.7729470909979352e-05, "loss": 0.4686, "step": 3928 }, { "epoch": 0.73, "learning_rate": 1.772820343139595e-05, "loss": 0.47, "step": 3929 }, { "epoch": 0.73, "learning_rate": 1.7726935644471537e-05, "loss": 0.4548, "step": 3930 }, { "epoch": 0.73, "learning_rate": 1.7725667549256697e-05, "loss": 0.4798, "step": 3931 }, { "epoch": 0.73, "learning_rate": 1.772439914580203e-05, "loss": 0.4701, "step": 3932 }, { "epoch": 0.73, "learning_rate": 1.7723130434158133e-05, "loss": 0.4905, "step": 3933 }, { "epoch": 0.73, "learning_rate": 1.7721861414375637e-05, "loss": 0.4452, "step": 3934 }, { "epoch": 0.73, "learning_rate": 1.7720592086505163e-05, "loss": 0.4655, "step": 3935 }, { "epoch": 0.73, "learning_rate": 1.771932245059736e-05, "loss": 0.4808, "step": 3936 }, { "epoch": 0.73, "learning_rate": 1.7718052506702882e-05, "loss": 0.4838, "step": 3937 }, { "epoch": 0.73, "learning_rate": 1.7716782254872397e-05, "loss": 0.4498, "step": 3938 }, { "epoch": 0.73, "learning_rate": 1.7715511695156592e-05, "loss": 0.4561, "step": 3939 }, { "epoch": 0.73, "learning_rate": 1.7714240827606152e-05, "loss": 0.468, "step": 3940 }, { "epoch": 0.73, "learning_rate": 1.771296965227179e-05, "loss": 0.458, "step": 3941 }, { "epoch": 0.73, "learning_rate": 1.7711698169204213e-05, "loss": 0.4951, "step": 3942 }, { "epoch": 0.73, "learning_rate": 1.771042637845416e-05, "loss": 0.4659, "step": 3943 }, { "epoch": 0.73, "learning_rate": 1.770915428007237e-05, "loss": 0.4475, "step": 3944 }, { "epoch": 0.73, "learning_rate": 1.7707881874109597e-05, "loss": 0.4691, "step": 3945 }, { "epoch": 0.73, "learning_rate": 1.770660916061661e-05, "loss": 0.4795, "step": 3946 }, { "epoch": 0.73, "learning_rate": 1.770533613964418e-05, "loss": 0.4667, "step": 3947 }, { "epoch": 0.73, "learning_rate": 1.7704062811243106e-05, "loss": 0.4719, "step": 3948 }, { "epoch": 0.73, "learning_rate": 1.7702789175464192e-05, "loss": 0.4506, "step": 3949 }, { "epoch": 0.73, "learning_rate": 1.7701515232358252e-05, "loss": 0.4725, "step": 3950 }, { "epoch": 0.73, "learning_rate": 1.7700240981976114e-05, "loss": 0.4604, "step": 3951 }, { "epoch": 0.73, "learning_rate": 1.7698966424368614e-05, "loss": 0.4778, "step": 3952 }, { "epoch": 0.73, "learning_rate": 1.7697691559586608e-05, "loss": 0.4455, "step": 3953 }, { "epoch": 0.73, "learning_rate": 1.7696416387680962e-05, "loss": 0.4666, "step": 3954 }, { "epoch": 0.73, "learning_rate": 1.7695140908702552e-05, "loss": 0.4537, "step": 3955 }, { "epoch": 0.73, "learning_rate": 1.7693865122702264e-05, "loss": 0.4557, "step": 3956 }, { "epoch": 0.73, "learning_rate": 1.7692589029731006e-05, "loss": 0.4942, "step": 3957 }, { "epoch": 0.73, "learning_rate": 1.7691312629839687e-05, "loss": 0.4557, "step": 3958 }, { "epoch": 0.73, "learning_rate": 1.7690035923079234e-05, "loss": 0.4443, "step": 3959 }, { "epoch": 0.73, "learning_rate": 1.7688758909500588e-05, "loss": 0.473, "step": 3960 }, { "epoch": 0.73, "learning_rate": 1.7687481589154692e-05, "loss": 0.4723, "step": 3961 }, { "epoch": 0.73, "learning_rate": 1.7686203962092515e-05, "loss": 0.4563, "step": 3962 }, { "epoch": 0.73, "learning_rate": 1.768492602836503e-05, "loss": 0.4556, "step": 3963 }, { "epoch": 0.73, "learning_rate": 1.7683647788023228e-05, "loss": 0.4662, "step": 3964 }, { "epoch": 0.73, "learning_rate": 1.7682369241118104e-05, "loss": 0.469, "step": 3965 }, { "epoch": 0.73, "learning_rate": 1.768109038770067e-05, "loss": 0.4471, "step": 3966 }, { "epoch": 0.73, "learning_rate": 1.767981122782195e-05, "loss": 0.4545, "step": 3967 }, { "epoch": 0.73, "learning_rate": 1.7678531761532986e-05, "loss": 0.4422, "step": 3968 }, { "epoch": 0.73, "learning_rate": 1.7677251988884813e-05, "loss": 0.4798, "step": 3969 }, { "epoch": 0.73, "learning_rate": 1.7675971909928503e-05, "loss": 0.4748, "step": 3970 }, { "epoch": 0.73, "learning_rate": 1.7674691524715126e-05, "loss": 0.4619, "step": 3971 }, { "epoch": 0.73, "learning_rate": 1.7673410833295767e-05, "loss": 0.4636, "step": 3972 }, { "epoch": 0.74, "learning_rate": 1.7672129835721523e-05, "loss": 0.4584, "step": 3973 }, { "epoch": 0.74, "learning_rate": 1.76708485320435e-05, "loss": 0.4565, "step": 3974 }, { "epoch": 0.74, "learning_rate": 1.7669566922312826e-05, "loss": 0.4769, "step": 3975 }, { "epoch": 0.74, "learning_rate": 1.7668285006580633e-05, "loss": 0.4751, "step": 3976 }, { "epoch": 0.74, "learning_rate": 1.766700278489806e-05, "loss": 0.4666, "step": 3977 }, { "epoch": 0.74, "learning_rate": 1.7665720257316277e-05, "loss": 0.4748, "step": 3978 }, { "epoch": 0.74, "learning_rate": 1.766443742388645e-05, "loss": 0.4606, "step": 3979 }, { "epoch": 0.74, "learning_rate": 1.7663154284659752e-05, "loss": 0.4735, "step": 3980 }, { "epoch": 0.74, "learning_rate": 1.766187083968739e-05, "loss": 0.4584, "step": 3981 }, { "epoch": 0.74, "learning_rate": 1.7660587089020567e-05, "loss": 0.4647, "step": 3982 }, { "epoch": 0.74, "learning_rate": 1.7659303032710502e-05, "loss": 0.4527, "step": 3983 }, { "epoch": 0.74, "learning_rate": 1.7658018670808426e-05, "loss": 0.4691, "step": 3984 }, { "epoch": 0.74, "learning_rate": 1.7656734003365583e-05, "loss": 0.457, "step": 3985 }, { "epoch": 0.74, "learning_rate": 1.765544903043323e-05, "loss": 0.4705, "step": 3986 }, { "epoch": 0.74, "learning_rate": 1.7654163752062637e-05, "loss": 0.4505, "step": 3987 }, { "epoch": 0.74, "learning_rate": 1.7652878168305082e-05, "loss": 0.4657, "step": 3988 }, { "epoch": 0.74, "learning_rate": 1.765159227921185e-05, "loss": 0.4677, "step": 3989 }, { "epoch": 0.74, "learning_rate": 1.7650306084834262e-05, "loss": 0.4421, "step": 3990 }, { "epoch": 0.74, "learning_rate": 1.764901958522362e-05, "loss": 0.4611, "step": 3991 }, { "epoch": 0.74, "learning_rate": 1.764773278043126e-05, "loss": 0.4678, "step": 3992 }, { "epoch": 0.74, "learning_rate": 1.764644567050852e-05, "loss": 0.455, "step": 3993 }, { "epoch": 0.74, "learning_rate": 1.7645158255506757e-05, "loss": 0.4853, "step": 3994 }, { "epoch": 0.74, "learning_rate": 1.7643870535477333e-05, "loss": 0.4541, "step": 3995 }, { "epoch": 0.74, "learning_rate": 1.7642582510471626e-05, "loss": 0.4513, "step": 3996 }, { "epoch": 0.74, "learning_rate": 1.7641294180541028e-05, "loss": 0.468, "step": 3997 }, { "epoch": 0.74, "learning_rate": 1.7640005545736935e-05, "loss": 0.4565, "step": 3998 }, { "epoch": 0.74, "learning_rate": 1.763871660611077e-05, "loss": 0.4833, "step": 3999 }, { "epoch": 0.74, "learning_rate": 1.7637427361713957e-05, "loss": 0.4785, "step": 4000 }, { "epoch": 0.74, "learning_rate": 1.7636137812597927e-05, "loss": 0.4724, "step": 4001 }, { "epoch": 0.74, "learning_rate": 1.763484795881414e-05, "loss": 0.4546, "step": 4002 }, { "epoch": 0.74, "learning_rate": 1.7633557800414055e-05, "loss": 0.4546, "step": 4003 }, { "epoch": 0.74, "learning_rate": 1.7632267337449148e-05, "loss": 0.472, "step": 4004 }, { "epoch": 0.74, "learning_rate": 1.7630976569970905e-05, "loss": 0.4704, "step": 4005 }, { "epoch": 0.74, "learning_rate": 1.7629685498030823e-05, "loss": 0.4795, "step": 4006 }, { "epoch": 0.74, "learning_rate": 1.7628394121680415e-05, "loss": 0.4517, "step": 4007 }, { "epoch": 0.74, "learning_rate": 1.762710244097121e-05, "loss": 0.4586, "step": 4008 }, { "epoch": 0.74, "learning_rate": 1.7625810455954733e-05, "loss": 0.4547, "step": 4009 }, { "epoch": 0.74, "learning_rate": 1.762451816668254e-05, "loss": 0.4733, "step": 4010 }, { "epoch": 0.74, "learning_rate": 1.762322557320619e-05, "loss": 0.4651, "step": 4011 }, { "epoch": 0.74, "learning_rate": 1.7621932675577252e-05, "loss": 0.4565, "step": 4012 }, { "epoch": 0.74, "learning_rate": 1.7620639473847312e-05, "loss": 0.4827, "step": 4013 }, { "epoch": 0.74, "learning_rate": 1.7619345968067968e-05, "loss": 0.4504, "step": 4014 }, { "epoch": 0.74, "learning_rate": 1.7618052158290822e-05, "loss": 0.469, "step": 4015 }, { "epoch": 0.74, "learning_rate": 1.7616758044567505e-05, "loss": 0.4798, "step": 4016 }, { "epoch": 0.74, "learning_rate": 1.761546362694964e-05, "loss": 0.4675, "step": 4017 }, { "epoch": 0.74, "learning_rate": 1.7614168905488877e-05, "loss": 0.4762, "step": 4018 }, { "epoch": 0.74, "learning_rate": 1.7612873880236874e-05, "loss": 0.4736, "step": 4019 }, { "epoch": 0.74, "learning_rate": 1.7611578551245294e-05, "loss": 0.441, "step": 4020 }, { "epoch": 0.74, "learning_rate": 1.7610282918565825e-05, "loss": 0.4587, "step": 4021 }, { "epoch": 0.74, "learning_rate": 1.760898698225016e-05, "loss": 0.4569, "step": 4022 }, { "epoch": 0.74, "learning_rate": 1.7607690742349995e-05, "loss": 0.4507, "step": 4023 }, { "epoch": 0.74, "learning_rate": 1.760639419891706e-05, "loss": 0.4626, "step": 4024 }, { "epoch": 0.74, "learning_rate": 1.760509735200308e-05, "loss": 0.4632, "step": 4025 }, { "epoch": 0.74, "learning_rate": 1.7603800201659794e-05, "loss": 0.4558, "step": 4026 }, { "epoch": 0.75, "learning_rate": 1.7602502747938958e-05, "loss": 0.469, "step": 4027 }, { "epoch": 0.75, "learning_rate": 1.7601204990892336e-05, "loss": 0.4454, "step": 4028 }, { "epoch": 0.75, "learning_rate": 1.7599906930571714e-05, "loss": 0.4453, "step": 4029 }, { "epoch": 0.75, "learning_rate": 1.7598608567028873e-05, "loss": 0.4593, "step": 4030 }, { "epoch": 0.75, "learning_rate": 1.759730990031562e-05, "loss": 0.4463, "step": 4031 }, { "epoch": 0.75, "learning_rate": 1.7596010930483764e-05, "loss": 0.4576, "step": 4032 }, { "epoch": 0.75, "learning_rate": 1.7594711657585138e-05, "loss": 0.4768, "step": 4033 }, { "epoch": 0.75, "learning_rate": 1.759341208167158e-05, "loss": 0.47, "step": 4034 }, { "epoch": 0.75, "learning_rate": 1.7592112202794934e-05, "loss": 0.4516, "step": 4035 }, { "epoch": 0.75, "learning_rate": 1.759081202100707e-05, "loss": 0.4582, "step": 4036 }, { "epoch": 0.75, "learning_rate": 1.758951153635986e-05, "loss": 0.4602, "step": 4037 }, { "epoch": 0.75, "learning_rate": 1.7588210748905196e-05, "loss": 0.4561, "step": 4038 }, { "epoch": 0.75, "learning_rate": 1.7586909658694965e-05, "loss": 0.4471, "step": 4039 }, { "epoch": 0.75, "learning_rate": 1.758560826578109e-05, "loss": 0.4616, "step": 4040 }, { "epoch": 0.75, "learning_rate": 1.758430657021549e-05, "loss": 0.459, "step": 4041 }, { "epoch": 0.75, "learning_rate": 1.7583004572050096e-05, "loss": 0.4554, "step": 4042 }, { "epoch": 0.75, "learning_rate": 1.758170227133686e-05, "loss": 0.4628, "step": 4043 }, { "epoch": 0.75, "learning_rate": 1.7580399668127746e-05, "loss": 0.4922, "step": 4044 }, { "epoch": 0.75, "learning_rate": 1.7579096762474714e-05, "loss": 0.446, "step": 4045 }, { "epoch": 0.75, "learning_rate": 1.7577793554429756e-05, "loss": 0.4681, "step": 4046 }, { "epoch": 0.75, "learning_rate": 1.7576490044044866e-05, "loss": 0.455, "step": 4047 }, { "epoch": 0.75, "learning_rate": 1.757518623137205e-05, "loss": 0.4865, "step": 4048 }, { "epoch": 0.75, "learning_rate": 1.7573882116463322e-05, "loss": 0.4739, "step": 4049 }, { "epoch": 0.75, "learning_rate": 1.757257769937073e-05, "loss": 0.4622, "step": 4050 }, { "epoch": 0.75, "learning_rate": 1.75712729801463e-05, "loss": 0.4559, "step": 4051 }, { "epoch": 0.75, "learning_rate": 1.7569967958842102e-05, "loss": 0.4675, "step": 4052 }, { "epoch": 0.75, "learning_rate": 1.7568662635510195e-05, "loss": 0.4596, "step": 4053 }, { "epoch": 0.75, "learning_rate": 1.7567357010202664e-05, "loss": 0.4788, "step": 4054 }, { "epoch": 0.75, "learning_rate": 1.7566051082971597e-05, "loss": 0.4444, "step": 4055 }, { "epoch": 0.75, "learning_rate": 1.75647448538691e-05, "loss": 0.4524, "step": 4056 }, { "epoch": 0.75, "learning_rate": 1.756343832294729e-05, "loss": 0.4748, "step": 4057 }, { "epoch": 0.75, "learning_rate": 1.7562131490258293e-05, "loss": 0.4822, "step": 4058 }, { "epoch": 0.75, "learning_rate": 1.7560824355854254e-05, "loss": 0.4538, "step": 4059 }, { "epoch": 0.75, "learning_rate": 1.7559516919787318e-05, "loss": 0.4658, "step": 4060 }, { "epoch": 0.75, "learning_rate": 1.755820918210965e-05, "loss": 0.459, "step": 4061 }, { "epoch": 0.75, "learning_rate": 1.7556901142873435e-05, "loss": 0.4537, "step": 4062 }, { "epoch": 0.75, "learning_rate": 1.7555592802130853e-05, "loss": 0.4741, "step": 4063 }, { "epoch": 0.75, "learning_rate": 1.755428415993411e-05, "loss": 0.4709, "step": 4064 }, { "epoch": 0.75, "learning_rate": 1.7552975216335414e-05, "loss": 0.4565, "step": 4065 }, { "epoch": 0.75, "learning_rate": 1.755166597138699e-05, "loss": 0.4733, "step": 4066 }, { "epoch": 0.75, "learning_rate": 1.7550356425141073e-05, "loss": 0.462, "step": 4067 }, { "epoch": 0.75, "learning_rate": 1.7549046577649917e-05, "loss": 0.4539, "step": 4068 }, { "epoch": 0.75, "learning_rate": 1.754773642896578e-05, "loss": 0.4655, "step": 4069 }, { "epoch": 0.75, "learning_rate": 1.7546425979140932e-05, "loss": 0.4612, "step": 4070 }, { "epoch": 0.75, "learning_rate": 1.7545115228227658e-05, "loss": 0.473, "step": 4071 }, { "epoch": 0.75, "learning_rate": 1.7543804176278257e-05, "loss": 0.4645, "step": 4072 }, { "epoch": 0.75, "learning_rate": 1.7542492823345036e-05, "loss": 0.4797, "step": 4073 }, { "epoch": 0.75, "learning_rate": 1.7541181169480314e-05, "loss": 0.4648, "step": 4074 }, { "epoch": 0.75, "learning_rate": 1.753986921473643e-05, "loss": 0.4432, "step": 4075 }, { "epoch": 0.75, "learning_rate": 1.753855695916572e-05, "loss": 0.4251, "step": 4076 }, { "epoch": 0.75, "learning_rate": 1.7537244402820547e-05, "loss": 0.4737, "step": 4077 }, { "epoch": 0.75, "learning_rate": 1.7535931545753276e-05, "loss": 0.4533, "step": 4078 }, { "epoch": 0.75, "learning_rate": 1.7534618388016292e-05, "loss": 0.4368, "step": 4079 }, { "epoch": 0.75, "learning_rate": 1.753330492966198e-05, "loss": 0.4659, "step": 4080 }, { "epoch": 0.76, "learning_rate": 1.7531991170742753e-05, "loss": 0.4604, "step": 4081 }, { "epoch": 0.76, "learning_rate": 1.7530677111311017e-05, "loss": 0.4553, "step": 4082 }, { "epoch": 0.76, "learning_rate": 1.7529362751419216e-05, "loss": 0.4675, "step": 4083 }, { "epoch": 0.76, "learning_rate": 1.7528048091119773e-05, "loss": 0.4681, "step": 4084 }, { "epoch": 0.76, "learning_rate": 1.752673313046515e-05, "loss": 0.463, "step": 4085 }, { "epoch": 0.76, "learning_rate": 1.7525417869507814e-05, "loss": 0.4541, "step": 4086 }, { "epoch": 0.76, "learning_rate": 1.7524102308300236e-05, "loss": 0.486, "step": 4087 }, { "epoch": 0.76, "learning_rate": 1.7522786446894908e-05, "loss": 0.4628, "step": 4088 }, { "epoch": 0.76, "learning_rate": 1.752147028534433e-05, "loss": 0.4479, "step": 4089 }, { "epoch": 0.76, "learning_rate": 1.7520153823701008e-05, "loss": 0.4574, "step": 4090 }, { "epoch": 0.76, "learning_rate": 1.7518837062017476e-05, "loss": 0.4772, "step": 4091 }, { "epoch": 0.76, "learning_rate": 1.7517520000346265e-05, "loss": 0.4476, "step": 4092 }, { "epoch": 0.76, "learning_rate": 1.7516202638739925e-05, "loss": 0.4496, "step": 4093 }, { "epoch": 0.76, "learning_rate": 1.7514884977251016e-05, "loss": 0.4433, "step": 4094 }, { "epoch": 0.76, "learning_rate": 1.7513567015932108e-05, "loss": 0.4739, "step": 4095 }, { "epoch": 0.76, "learning_rate": 1.7512248754835785e-05, "loss": 0.452, "step": 4096 }, { "epoch": 0.76, "learning_rate": 1.751093019401465e-05, "loss": 0.4742, "step": 4097 }, { "epoch": 0.76, "learning_rate": 1.7509611333521303e-05, "loss": 0.4537, "step": 4098 }, { "epoch": 0.76, "learning_rate": 1.7508292173408367e-05, "loss": 0.474, "step": 4099 }, { "epoch": 0.76, "learning_rate": 1.7506972713728478e-05, "loss": 0.4625, "step": 4100 }, { "epoch": 0.76, "learning_rate": 1.7505652954534272e-05, "loss": 0.4667, "step": 4101 }, { "epoch": 0.76, "learning_rate": 1.7504332895878415e-05, "loss": 0.4705, "step": 4102 }, { "epoch": 0.76, "learning_rate": 1.7503012537813566e-05, "loss": 0.4557, "step": 4103 }, { "epoch": 0.76, "learning_rate": 1.750169188039241e-05, "loss": 0.4785, "step": 4104 }, { "epoch": 0.76, "learning_rate": 1.7500370923667637e-05, "loss": 0.4702, "step": 4105 }, { "epoch": 0.76, "learning_rate": 1.7499049667691946e-05, "loss": 0.4823, "step": 4106 }, { "epoch": 0.76, "learning_rate": 1.749772811251806e-05, "loss": 0.4721, "step": 4107 }, { "epoch": 0.76, "learning_rate": 1.7496406258198706e-05, "loss": 0.4705, "step": 4108 }, { "epoch": 0.76, "learning_rate": 1.749508410478662e-05, "loss": 0.4691, "step": 4109 }, { "epoch": 0.76, "learning_rate": 1.7493761652334555e-05, "loss": 0.463, "step": 4110 }, { "epoch": 0.76, "learning_rate": 1.7492438900895274e-05, "loss": 0.4364, "step": 4111 }, { "epoch": 0.76, "learning_rate": 1.7491115850521554e-05, "loss": 0.4649, "step": 4112 }, { "epoch": 0.76, "learning_rate": 1.748979250126618e-05, "loss": 0.4686, "step": 4113 }, { "epoch": 0.76, "learning_rate": 1.7488468853181952e-05, "loss": 0.457, "step": 4114 }, { "epoch": 0.76, "learning_rate": 1.7487144906321684e-05, "loss": 0.4641, "step": 4115 }, { "epoch": 0.76, "learning_rate": 1.7485820660738194e-05, "loss": 0.4621, "step": 4116 }, { "epoch": 0.76, "learning_rate": 1.748449611648432e-05, "loss": 0.4764, "step": 4117 }, { "epoch": 0.76, "learning_rate": 1.7483171273612905e-05, "loss": 0.4817, "step": 4118 }, { "epoch": 0.76, "learning_rate": 1.7481846132176813e-05, "loss": 0.4573, "step": 4119 }, { "epoch": 0.76, "learning_rate": 1.7480520692228916e-05, "loss": 0.4727, "step": 4120 }, { "epoch": 0.76, "learning_rate": 1.7479194953822088e-05, "loss": 0.4735, "step": 4121 }, { "epoch": 0.76, "learning_rate": 1.7477868917009232e-05, "loss": 0.4612, "step": 4122 }, { "epoch": 0.76, "learning_rate": 1.747654258184325e-05, "loss": 0.4557, "step": 4123 }, { "epoch": 0.76, "learning_rate": 1.747521594837706e-05, "loss": 0.4551, "step": 4124 }, { "epoch": 0.76, "learning_rate": 1.7473889016663597e-05, "loss": 0.4711, "step": 4125 }, { "epoch": 0.76, "learning_rate": 1.74725617867558e-05, "loss": 0.4639, "step": 4126 }, { "epoch": 0.76, "learning_rate": 1.7471234258706616e-05, "loss": 0.4577, "step": 4127 }, { "epoch": 0.76, "learning_rate": 1.7469906432569023e-05, "loss": 0.4618, "step": 4128 }, { "epoch": 0.76, "learning_rate": 1.7468578308395993e-05, "loss": 0.4507, "step": 4129 }, { "epoch": 0.76, "learning_rate": 1.746724988624052e-05, "loss": 0.4825, "step": 4130 }, { "epoch": 0.76, "learning_rate": 1.7465921166155598e-05, "loss": 0.4698, "step": 4131 }, { "epoch": 0.76, "learning_rate": 1.7464592148194245e-05, "loss": 0.4605, "step": 4132 }, { "epoch": 0.76, "learning_rate": 1.746326283240948e-05, "loss": 0.4426, "step": 4133 }, { "epoch": 0.76, "learning_rate": 1.7461933218854353e-05, "loss": 0.4683, "step": 4134 }, { "epoch": 0.77, "learning_rate": 1.7460603307581904e-05, "loss": 0.4728, "step": 4135 }, { "epoch": 0.77, "learning_rate": 1.7459273098645196e-05, "loss": 0.4838, "step": 4136 }, { "epoch": 0.77, "learning_rate": 1.74579425920973e-05, "loss": 0.4723, "step": 4137 }, { "epoch": 0.77, "learning_rate": 1.7456611787991303e-05, "loss": 0.4484, "step": 4138 }, { "epoch": 0.77, "learning_rate": 1.7455280686380302e-05, "loss": 0.45, "step": 4139 }, { "epoch": 0.77, "learning_rate": 1.7453949287317407e-05, "loss": 0.4611, "step": 4140 }, { "epoch": 0.77, "learning_rate": 1.7452617590855733e-05, "loss": 0.4756, "step": 4141 }, { "epoch": 0.77, "learning_rate": 1.7451285597048414e-05, "loss": 0.4789, "step": 4142 }, { "epoch": 0.77, "learning_rate": 1.74499533059486e-05, "loss": 0.473, "step": 4143 }, { "epoch": 0.77, "learning_rate": 1.744862071760944e-05, "loss": 0.4528, "step": 4144 }, { "epoch": 0.77, "learning_rate": 1.7447287832084106e-05, "loss": 0.4611, "step": 4145 }, { "epoch": 0.77, "learning_rate": 1.7445954649425774e-05, "loss": 0.4615, "step": 4146 }, { "epoch": 0.77, "learning_rate": 1.7444621169687638e-05, "loss": 0.4498, "step": 4147 }, { "epoch": 0.77, "learning_rate": 1.7443287392922898e-05, "loss": 0.4674, "step": 4148 }, { "epoch": 0.77, "learning_rate": 1.744195331918477e-05, "loss": 0.4698, "step": 4149 }, { "epoch": 0.77, "learning_rate": 1.7440618948526488e-05, "loss": 0.4645, "step": 4150 }, { "epoch": 0.77, "learning_rate": 1.7439284281001287e-05, "loss": 0.4634, "step": 4151 }, { "epoch": 0.77, "learning_rate": 1.7437949316662412e-05, "loss": 0.4496, "step": 4152 }, { "epoch": 0.77, "learning_rate": 1.7436614055563135e-05, "loss": 0.4628, "step": 4153 }, { "epoch": 0.77, "learning_rate": 1.743527849775672e-05, "loss": 0.467, "step": 4154 }, { "epoch": 0.77, "learning_rate": 1.7433942643296466e-05, "loss": 0.4698, "step": 4155 }, { "epoch": 0.77, "learning_rate": 1.743260649223566e-05, "loss": 0.4542, "step": 4156 }, { "epoch": 0.77, "learning_rate": 1.7431270044627616e-05, "loss": 0.4535, "step": 4157 }, { "epoch": 0.77, "learning_rate": 1.7429933300525657e-05, "loss": 0.4482, "step": 4158 }, { "epoch": 0.77, "learning_rate": 1.7428596259983113e-05, "loss": 0.4711, "step": 4159 }, { "epoch": 0.77, "learning_rate": 1.7427258923053334e-05, "loss": 0.4682, "step": 4160 }, { "epoch": 0.77, "learning_rate": 1.7425921289789673e-05, "loss": 0.4637, "step": 4161 }, { "epoch": 0.77, "learning_rate": 1.74245833602455e-05, "loss": 0.46, "step": 4162 }, { "epoch": 0.77, "learning_rate": 1.74232451344742e-05, "loss": 0.441, "step": 4163 }, { "epoch": 0.77, "learning_rate": 1.742190661252917e-05, "loss": 0.4603, "step": 4164 }, { "epoch": 0.77, "learning_rate": 1.74205677944638e-05, "loss": 0.4806, "step": 4165 }, { "epoch": 0.77, "learning_rate": 1.7419228680331514e-05, "loss": 0.4495, "step": 4166 }, { "epoch": 0.77, "learning_rate": 1.7417889270185737e-05, "loss": 0.4532, "step": 4167 }, { "epoch": 0.77, "learning_rate": 1.7416549564079917e-05, "loss": 0.4382, "step": 4168 }, { "epoch": 0.77, "learning_rate": 1.74152095620675e-05, "loss": 0.466, "step": 4169 }, { "epoch": 0.77, "learning_rate": 1.7413869264201948e-05, "loss": 0.4666, "step": 4170 }, { "epoch": 0.77, "learning_rate": 1.7412528670536743e-05, "loss": 0.4965, "step": 4171 }, { "epoch": 0.77, "learning_rate": 1.7411187781125362e-05, "loss": 0.4481, "step": 4172 }, { "epoch": 0.77, "learning_rate": 1.7409846596021313e-05, "loss": 0.4471, "step": 4173 }, { "epoch": 0.77, "learning_rate": 1.7408505115278106e-05, "loss": 0.4566, "step": 4174 }, { "epoch": 0.77, "learning_rate": 1.7407163338949257e-05, "loss": 0.4432, "step": 4175 }, { "epoch": 0.77, "learning_rate": 1.740582126708831e-05, "loss": 0.4608, "step": 4176 }, { "epoch": 0.77, "learning_rate": 1.7404478899748804e-05, "loss": 0.4886, "step": 4177 }, { "epoch": 0.77, "learning_rate": 1.7403136236984296e-05, "loss": 0.4594, "step": 4178 }, { "epoch": 0.77, "learning_rate": 1.7401793278848363e-05, "loss": 0.4703, "step": 4179 }, { "epoch": 0.77, "learning_rate": 1.7400450025394577e-05, "loss": 0.4862, "step": 4180 }, { "epoch": 0.77, "learning_rate": 1.739910647667654e-05, "loss": 0.4732, "step": 4181 }, { "epoch": 0.77, "learning_rate": 1.7397762632747853e-05, "loss": 0.4492, "step": 4182 }, { "epoch": 0.77, "learning_rate": 1.7396418493662132e-05, "loss": 0.449, "step": 4183 }, { "epoch": 0.77, "learning_rate": 1.739507405947301e-05, "loss": 0.4586, "step": 4184 }, { "epoch": 0.77, "learning_rate": 1.7393729330234123e-05, "loss": 0.4518, "step": 4185 }, { "epoch": 0.77, "learning_rate": 1.7392384305999125e-05, "loss": 0.4549, "step": 4186 }, { "epoch": 0.77, "learning_rate": 1.7391038986821682e-05, "loss": 0.4639, "step": 4187 }, { "epoch": 0.77, "learning_rate": 1.7389693372755464e-05, "loss": 0.4398, "step": 4188 }, { "epoch": 0.78, "learning_rate": 1.7388347463854164e-05, "loss": 0.4789, "step": 4189 }, { "epoch": 0.78, "learning_rate": 1.738700126017148e-05, "loss": 0.4652, "step": 4190 }, { "epoch": 0.78, "learning_rate": 1.7385654761761123e-05, "loss": 0.4536, "step": 4191 }, { "epoch": 0.78, "learning_rate": 1.7384307968676814e-05, "loss": 0.4467, "step": 4192 }, { "epoch": 0.78, "learning_rate": 1.7382960880972287e-05, "loss": 0.4728, "step": 4193 }, { "epoch": 0.78, "learning_rate": 1.7381613498701292e-05, "loss": 0.4432, "step": 4194 }, { "epoch": 0.78, "learning_rate": 1.7380265821917585e-05, "loss": 0.4342, "step": 4195 }, { "epoch": 0.78, "learning_rate": 1.7378917850674935e-05, "loss": 0.4556, "step": 4196 }, { "epoch": 0.78, "learning_rate": 1.7377569585027127e-05, "loss": 0.4703, "step": 4197 }, { "epoch": 0.78, "learning_rate": 1.737622102502795e-05, "loss": 0.4682, "step": 4198 }, { "epoch": 0.78, "learning_rate": 1.737487217073121e-05, "loss": 0.4606, "step": 4199 }, { "epoch": 0.78, "learning_rate": 1.7373523022190723e-05, "loss": 0.4569, "step": 4200 }, { "epoch": 0.78, "learning_rate": 1.7372173579460324e-05, "loss": 0.4715, "step": 4201 }, { "epoch": 0.78, "learning_rate": 1.7370823842593843e-05, "loss": 0.463, "step": 4202 }, { "epoch": 0.78, "learning_rate": 1.736947381164514e-05, "loss": 0.4544, "step": 4203 }, { "epoch": 0.78, "learning_rate": 1.736812348666808e-05, "loss": 0.4418, "step": 4204 }, { "epoch": 0.78, "learning_rate": 1.7366772867716527e-05, "loss": 0.4497, "step": 4205 }, { "epoch": 0.78, "learning_rate": 1.736542195484438e-05, "loss": 0.4677, "step": 4206 }, { "epoch": 0.78, "learning_rate": 1.7364070748105533e-05, "loss": 0.4734, "step": 4207 }, { "epoch": 0.78, "learning_rate": 1.73627192475539e-05, "loss": 0.4762, "step": 4208 }, { "epoch": 0.78, "learning_rate": 1.73613674532434e-05, "loss": 0.4501, "step": 4209 }, { "epoch": 0.78, "learning_rate": 1.7360015365227963e-05, "loss": 0.4599, "step": 4210 }, { "epoch": 0.78, "learning_rate": 1.7358662983561543e-05, "loss": 0.4637, "step": 4211 }, { "epoch": 0.78, "learning_rate": 1.7357310308298093e-05, "loss": 0.4509, "step": 4212 }, { "epoch": 0.78, "learning_rate": 1.7355957339491585e-05, "loss": 0.4416, "step": 4213 }, { "epoch": 0.78, "learning_rate": 1.7354604077195997e-05, "loss": 0.4497, "step": 4214 }, { "epoch": 0.78, "learning_rate": 1.7353250521465326e-05, "loss": 0.4674, "step": 4215 }, { "epoch": 0.78, "learning_rate": 1.735189667235357e-05, "loss": 0.4687, "step": 4216 }, { "epoch": 0.78, "learning_rate": 1.735054252991475e-05, "loss": 0.4602, "step": 4217 }, { "epoch": 0.78, "learning_rate": 1.7349188094202895e-05, "loss": 0.476, "step": 4218 }, { "epoch": 0.78, "learning_rate": 1.734783336527204e-05, "loss": 0.4663, "step": 4219 }, { "epoch": 0.78, "learning_rate": 1.7346478343176233e-05, "loss": 0.4757, "step": 4220 }, { "epoch": 0.78, "learning_rate": 1.7345123027969547e-05, "loss": 0.4711, "step": 4221 }, { "epoch": 0.78, "learning_rate": 1.7343767419706046e-05, "loss": 0.4563, "step": 4222 }, { "epoch": 0.78, "learning_rate": 1.734241151843983e-05, "loss": 0.4559, "step": 4223 }, { "epoch": 0.78, "learning_rate": 1.734105532422498e-05, "loss": 0.4673, "step": 4224 }, { "epoch": 0.78, "learning_rate": 1.733969883711562e-05, "loss": 0.4442, "step": 4225 }, { "epoch": 0.78, "learning_rate": 1.733834205716586e-05, "loss": 0.4712, "step": 4226 }, { "epoch": 0.78, "learning_rate": 1.7336984984429843e-05, "loss": 0.48, "step": 4227 }, { "epoch": 0.78, "learning_rate": 1.7335627618961707e-05, "loss": 0.4759, "step": 4228 }, { "epoch": 0.78, "learning_rate": 1.7334269960815614e-05, "loss": 0.4571, "step": 4229 }, { "epoch": 0.78, "learning_rate": 1.7332912010045727e-05, "loss": 0.4486, "step": 4230 }, { "epoch": 0.78, "learning_rate": 1.7331553766706224e-05, "loss": 0.4536, "step": 4231 }, { "epoch": 0.78, "learning_rate": 1.7330195230851303e-05, "loss": 0.471, "step": 4232 }, { "epoch": 0.78, "learning_rate": 1.7328836402535164e-05, "loss": 0.4716, "step": 4233 }, { "epoch": 0.78, "learning_rate": 1.732747728181202e-05, "loss": 0.4577, "step": 4234 }, { "epoch": 0.78, "learning_rate": 1.73261178687361e-05, "loss": 0.4601, "step": 4235 }, { "epoch": 0.78, "learning_rate": 1.732475816336164e-05, "loss": 0.4569, "step": 4236 }, { "epoch": 0.78, "learning_rate": 1.732339816574289e-05, "loss": 0.472, "step": 4237 }, { "epoch": 0.78, "learning_rate": 1.7322037875934114e-05, "loss": 0.4737, "step": 4238 }, { "epoch": 0.78, "learning_rate": 1.732067729398958e-05, "loss": 0.4492, "step": 4239 }, { "epoch": 0.78, "learning_rate": 1.731931641996358e-05, "loss": 0.4433, "step": 4240 }, { "epoch": 0.78, "learning_rate": 1.7317955253910404e-05, "loss": 0.4602, "step": 4241 }, { "epoch": 0.78, "learning_rate": 1.7316593795884365e-05, "loss": 0.4524, "step": 4242 }, { "epoch": 0.79, "learning_rate": 1.7315232045939775e-05, "loss": 0.4507, "step": 4243 }, { "epoch": 0.79, "learning_rate": 1.731387000413097e-05, "loss": 0.4347, "step": 4244 }, { "epoch": 0.79, "learning_rate": 1.73125076705123e-05, "loss": 0.4717, "step": 4245 }, { "epoch": 0.79, "learning_rate": 1.7311145045138105e-05, "loss": 0.4756, "step": 4246 }, { "epoch": 0.79, "learning_rate": 1.7309782128062765e-05, "loss": 0.4481, "step": 4247 }, { "epoch": 0.79, "learning_rate": 1.7308418919340648e-05, "loss": 0.4616, "step": 4248 }, { "epoch": 0.79, "learning_rate": 1.7307055419026148e-05, "loss": 0.4525, "step": 4249 }, { "epoch": 0.79, "learning_rate": 1.7305691627173665e-05, "loss": 0.4582, "step": 4250 }, { "epoch": 0.79, "learning_rate": 1.7304327543837612e-05, "loss": 0.4712, "step": 4251 }, { "epoch": 0.79, "learning_rate": 1.7302963169072417e-05, "loss": 0.4393, "step": 4252 }, { "epoch": 0.79, "learning_rate": 1.730159850293251e-05, "loss": 0.4372, "step": 4253 }, { "epoch": 0.79, "learning_rate": 1.730023354547234e-05, "loss": 0.456, "step": 4254 }, { "epoch": 0.79, "learning_rate": 1.7298868296746372e-05, "loss": 0.4414, "step": 4255 }, { "epoch": 0.79, "learning_rate": 1.729750275680907e-05, "loss": 0.4711, "step": 4256 }, { "epoch": 0.79, "learning_rate": 1.7296136925714916e-05, "loss": 0.4613, "step": 4257 }, { "epoch": 0.79, "learning_rate": 1.729477080351841e-05, "loss": 0.4513, "step": 4258 }, { "epoch": 0.79, "learning_rate": 1.7293404390274056e-05, "loss": 0.457, "step": 4259 }, { "epoch": 0.79, "learning_rate": 1.729203768603637e-05, "loss": 0.455, "step": 4260 }, { "epoch": 0.79, "learning_rate": 1.7290670690859877e-05, "loss": 0.4608, "step": 4261 }, { "epoch": 0.79, "learning_rate": 1.7289303404799125e-05, "loss": 0.4596, "step": 4262 }, { "epoch": 0.79, "learning_rate": 1.728793582790866e-05, "loss": 0.445, "step": 4263 }, { "epoch": 0.79, "learning_rate": 1.7286567960243052e-05, "loss": 0.4575, "step": 4264 }, { "epoch": 0.79, "learning_rate": 1.7285199801856874e-05, "loss": 0.4788, "step": 4265 }, { "epoch": 0.79, "learning_rate": 1.728383135280471e-05, "loss": 0.4551, "step": 4266 }, { "epoch": 0.79, "learning_rate": 1.7282462613141162e-05, "loss": 0.4667, "step": 4267 }, { "epoch": 0.79, "learning_rate": 1.7281093582920838e-05, "loss": 0.4506, "step": 4268 }, { "epoch": 0.79, "learning_rate": 1.727972426219836e-05, "loss": 0.4456, "step": 4269 }, { "epoch": 0.79, "learning_rate": 1.7278354651028362e-05, "loss": 0.4584, "step": 4270 }, { "epoch": 0.79, "learning_rate": 1.7276984749465492e-05, "loss": 0.4657, "step": 4271 }, { "epoch": 0.79, "learning_rate": 1.72756145575644e-05, "loss": 0.4482, "step": 4272 }, { "epoch": 0.79, "learning_rate": 1.727424407537976e-05, "loss": 0.4662, "step": 4273 }, { "epoch": 0.79, "learning_rate": 1.7272873302966248e-05, "loss": 0.4567, "step": 4274 }, { "epoch": 0.79, "learning_rate": 1.7271502240378556e-05, "loss": 0.4654, "step": 4275 }, { "epoch": 0.79, "learning_rate": 1.7270130887671387e-05, "loss": 0.4593, "step": 4276 }, { "epoch": 0.79, "learning_rate": 1.7268759244899456e-05, "loss": 0.463, "step": 4277 }, { "epoch": 0.79, "learning_rate": 1.7267387312117493e-05, "loss": 0.4766, "step": 4278 }, { "epoch": 0.79, "learning_rate": 1.7266015089380226e-05, "loss": 0.4615, "step": 4279 }, { "epoch": 0.79, "learning_rate": 1.7264642576742412e-05, "loss": 0.4678, "step": 4280 }, { "epoch": 0.79, "learning_rate": 1.7263269774258807e-05, "loss": 0.4273, "step": 4281 }, { "epoch": 0.79, "learning_rate": 1.7261896681984187e-05, "loss": 0.4605, "step": 4282 }, { "epoch": 0.79, "learning_rate": 1.726052329997334e-05, "loss": 0.4683, "step": 4283 }, { "epoch": 0.79, "learning_rate": 1.725914962828105e-05, "loss": 0.4685, "step": 4284 }, { "epoch": 0.79, "learning_rate": 1.725777566696213e-05, "loss": 0.4621, "step": 4285 }, { "epoch": 0.79, "learning_rate": 1.72564014160714e-05, "loss": 0.4523, "step": 4286 }, { "epoch": 0.79, "learning_rate": 1.7255026875663685e-05, "loss": 0.4446, "step": 4287 }, { "epoch": 0.79, "learning_rate": 1.7253652045793833e-05, "loss": 0.4599, "step": 4288 }, { "epoch": 0.79, "learning_rate": 1.7252276926516695e-05, "loss": 0.4528, "step": 4289 }, { "epoch": 0.79, "learning_rate": 1.7250901517887132e-05, "loss": 0.4533, "step": 4290 }, { "epoch": 0.79, "learning_rate": 1.7249525819960022e-05, "loss": 0.4713, "step": 4291 }, { "epoch": 0.79, "learning_rate": 1.7248149832790257e-05, "loss": 0.4524, "step": 4292 }, { "epoch": 0.79, "learning_rate": 1.7246773556432733e-05, "loss": 0.4593, "step": 4293 }, { "epoch": 0.79, "learning_rate": 1.724539699094236e-05, "loss": 0.4673, "step": 4294 }, { "epoch": 0.79, "learning_rate": 1.7244020136374064e-05, "loss": 0.4457, "step": 4295 }, { "epoch": 0.79, "learning_rate": 1.7242642992782775e-05, "loss": 0.461, "step": 4296 }, { "epoch": 0.8, "learning_rate": 1.724126556022344e-05, "loss": 0.4635, "step": 4297 }, { "epoch": 0.8, "learning_rate": 1.7239887838751017e-05, "loss": 0.4687, "step": 4298 }, { "epoch": 0.8, "learning_rate": 1.723850982842047e-05, "loss": 0.4625, "step": 4299 }, { "epoch": 0.8, "learning_rate": 1.7237131529286785e-05, "loss": 0.4812, "step": 4300 }, { "epoch": 0.8, "learning_rate": 1.723575294140495e-05, "loss": 0.4572, "step": 4301 }, { "epoch": 0.8, "learning_rate": 1.723437406482997e-05, "loss": 0.4387, "step": 4302 }, { "epoch": 0.8, "learning_rate": 1.723299489961686e-05, "loss": 0.4344, "step": 4303 }, { "epoch": 0.8, "learning_rate": 1.7231615445820647e-05, "loss": 0.4641, "step": 4304 }, { "epoch": 0.8, "learning_rate": 1.7230235703496362e-05, "loss": 0.4649, "step": 4305 }, { "epoch": 0.8, "learning_rate": 1.722885567269906e-05, "loss": 0.4603, "step": 4306 }, { "epoch": 0.8, "learning_rate": 1.7227475353483805e-05, "loss": 0.4625, "step": 4307 }, { "epoch": 0.8, "learning_rate": 1.7226094745905658e-05, "loss": 0.4637, "step": 4308 }, { "epoch": 0.8, "learning_rate": 1.7224713850019714e-05, "loss": 0.4617, "step": 4309 }, { "epoch": 0.8, "learning_rate": 1.7223332665881063e-05, "loss": 0.4554, "step": 4310 }, { "epoch": 0.8, "learning_rate": 1.722195119354481e-05, "loss": 0.4375, "step": 4311 }, { "epoch": 0.8, "learning_rate": 1.722056943306608e-05, "loss": 0.4656, "step": 4312 }, { "epoch": 0.8, "learning_rate": 1.7219187384499992e-05, "loss": 0.4777, "step": 4313 }, { "epoch": 0.8, "learning_rate": 1.7217805047901695e-05, "loss": 0.4769, "step": 4314 }, { "epoch": 0.8, "learning_rate": 1.7216422423326342e-05, "loss": 0.447, "step": 4315 }, { "epoch": 0.8, "learning_rate": 1.7215039510829098e-05, "loss": 0.4636, "step": 4316 }, { "epoch": 0.8, "learning_rate": 1.721365631046513e-05, "loss": 0.4825, "step": 4317 }, { "epoch": 0.8, "learning_rate": 1.7212272822289632e-05, "loss": 0.4484, "step": 4318 }, { "epoch": 0.8, "learning_rate": 1.7210889046357806e-05, "loss": 0.4669, "step": 4319 }, { "epoch": 0.8, "learning_rate": 1.7209504982724853e-05, "loss": 0.4662, "step": 4320 }, { "epoch": 0.8, "learning_rate": 1.7208120631446e-05, "loss": 0.4655, "step": 4321 }, { "epoch": 0.8, "learning_rate": 1.7206735992576482e-05, "loss": 0.4489, "step": 4322 }, { "epoch": 0.8, "learning_rate": 1.7205351066171538e-05, "loss": 0.4709, "step": 4323 }, { "epoch": 0.8, "learning_rate": 1.7203965852286426e-05, "loss": 0.4835, "step": 4324 }, { "epoch": 0.8, "learning_rate": 1.7202580350976415e-05, "loss": 0.4626, "step": 4325 }, { "epoch": 0.8, "learning_rate": 1.7201194562296785e-05, "loss": 0.4465, "step": 4326 }, { "epoch": 0.8, "learning_rate": 1.7199808486302824e-05, "loss": 0.4598, "step": 4327 }, { "epoch": 0.8, "learning_rate": 1.7198422123049833e-05, "loss": 0.4499, "step": 4328 }, { "epoch": 0.8, "learning_rate": 1.719703547259313e-05, "loss": 0.4532, "step": 4329 }, { "epoch": 0.8, "learning_rate": 1.7195648534988035e-05, "loss": 0.477, "step": 4330 }, { "epoch": 0.8, "learning_rate": 1.7194261310289885e-05, "loss": 0.4591, "step": 4331 }, { "epoch": 0.8, "learning_rate": 1.719287379855403e-05, "loss": 0.4607, "step": 4332 }, { "epoch": 0.8, "learning_rate": 1.7191485999835826e-05, "loss": 0.4487, "step": 4333 }, { "epoch": 0.8, "learning_rate": 1.7190097914190644e-05, "loss": 0.4629, "step": 4334 }, { "epoch": 0.8, "learning_rate": 1.718870954167387e-05, "loss": 0.4633, "step": 4335 }, { "epoch": 0.8, "learning_rate": 1.7187320882340898e-05, "loss": 0.4523, "step": 4336 }, { "epoch": 0.8, "learning_rate": 1.7185931936247122e-05, "loss": 0.4755, "step": 4337 }, { "epoch": 0.8, "learning_rate": 1.7184542703447974e-05, "loss": 0.5013, "step": 4338 }, { "epoch": 0.8, "learning_rate": 1.7183153183998866e-05, "loss": 0.45, "step": 4339 }, { "epoch": 0.8, "learning_rate": 1.7181763377955253e-05, "loss": 0.4561, "step": 4340 }, { "epoch": 0.8, "learning_rate": 1.718037328537257e-05, "loss": 0.467, "step": 4341 }, { "epoch": 0.8, "learning_rate": 1.7178982906306294e-05, "loss": 0.4557, "step": 4342 }, { "epoch": 0.8, "learning_rate": 1.7177592240811888e-05, "loss": 0.4387, "step": 4343 }, { "epoch": 0.8, "learning_rate": 1.7176201288944842e-05, "loss": 0.4538, "step": 4344 }, { "epoch": 0.8, "learning_rate": 1.717481005076065e-05, "loss": 0.4512, "step": 4345 }, { "epoch": 0.8, "learning_rate": 1.717341852631482e-05, "loss": 0.4547, "step": 4346 }, { "epoch": 0.8, "learning_rate": 1.7172026715662876e-05, "loss": 0.4874, "step": 4347 }, { "epoch": 0.8, "learning_rate": 1.717063461886034e-05, "loss": 0.4499, "step": 4348 }, { "epoch": 0.8, "learning_rate": 1.716924223596276e-05, "loss": 0.4566, "step": 4349 }, { "epoch": 0.8, "learning_rate": 1.716784956702569e-05, "loss": 0.4719, "step": 4350 }, { "epoch": 0.8, "learning_rate": 1.716645661210469e-05, "loss": 0.4455, "step": 4351 }, { "epoch": 0.81, "learning_rate": 1.7165063371255342e-05, "loss": 0.4701, "step": 4352 }, { "epoch": 0.81, "learning_rate": 1.716366984453323e-05, "loss": 0.4545, "step": 4353 }, { "epoch": 0.81, "learning_rate": 1.7162276031993953e-05, "loss": 0.4418, "step": 4354 }, { "epoch": 0.81, "learning_rate": 1.7160881933693127e-05, "loss": 0.4777, "step": 4355 }, { "epoch": 0.81, "learning_rate": 1.715948754968637e-05, "loss": 0.4758, "step": 4356 }, { "epoch": 0.81, "learning_rate": 1.715809288002931e-05, "loss": 0.4435, "step": 4357 }, { "epoch": 0.81, "learning_rate": 1.7156697924777602e-05, "loss": 0.4504, "step": 4358 }, { "epoch": 0.81, "learning_rate": 1.7155302683986895e-05, "loss": 0.4528, "step": 4359 }, { "epoch": 0.81, "learning_rate": 1.715390715771286e-05, "loss": 0.4595, "step": 4360 }, { "epoch": 0.81, "learning_rate": 1.7152511346011172e-05, "loss": 0.4756, "step": 4361 }, { "epoch": 0.81, "learning_rate": 1.7151115248937525e-05, "loss": 0.4433, "step": 4362 }, { "epoch": 0.81, "learning_rate": 1.714971886654762e-05, "loss": 0.4646, "step": 4363 }, { "epoch": 0.81, "learning_rate": 1.714832219889717e-05, "loss": 0.4692, "step": 4364 }, { "epoch": 0.81, "learning_rate": 1.7146925246041897e-05, "loss": 0.4388, "step": 4365 }, { "epoch": 0.81, "learning_rate": 1.714552800803754e-05, "loss": 0.4679, "step": 4366 }, { "epoch": 0.81, "learning_rate": 1.7144130484939847e-05, "loss": 0.4687, "step": 4367 }, { "epoch": 0.81, "learning_rate": 1.714273267680457e-05, "loss": 0.4509, "step": 4368 }, { "epoch": 0.81, "learning_rate": 1.7141334583687488e-05, "loss": 0.4631, "step": 4369 }, { "epoch": 0.81, "learning_rate": 1.7139936205644377e-05, "loss": 0.4772, "step": 4370 }, { "epoch": 0.81, "learning_rate": 1.713853754273103e-05, "loss": 0.4579, "step": 4371 }, { "epoch": 0.81, "learning_rate": 1.713713859500325e-05, "loss": 0.4573, "step": 4372 }, { "epoch": 0.81, "learning_rate": 1.7135739362516856e-05, "loss": 0.4479, "step": 4373 }, { "epoch": 0.81, "learning_rate": 1.7134339845327673e-05, "loss": 0.4697, "step": 4374 }, { "epoch": 0.81, "learning_rate": 1.713294004349154e-05, "loss": 0.4362, "step": 4375 }, { "epoch": 0.81, "learning_rate": 1.7131539957064303e-05, "loss": 0.4589, "step": 4376 }, { "epoch": 0.81, "learning_rate": 1.7130139586101826e-05, "loss": 0.4574, "step": 4377 }, { "epoch": 0.81, "learning_rate": 1.7128738930659983e-05, "loss": 0.471, "step": 4378 }, { "epoch": 0.81, "learning_rate": 1.712733799079465e-05, "loss": 0.4499, "step": 4379 }, { "epoch": 0.81, "learning_rate": 1.7125936766561734e-05, "loss": 0.4559, "step": 4380 }, { "epoch": 0.81, "learning_rate": 1.712453525801713e-05, "loss": 0.4423, "step": 4381 }, { "epoch": 0.81, "learning_rate": 1.7123133465216762e-05, "loss": 0.4431, "step": 4382 }, { "epoch": 0.81, "learning_rate": 1.7121731388216556e-05, "loss": 0.4722, "step": 4383 }, { "epoch": 0.81, "learning_rate": 1.7120329027072452e-05, "loss": 0.4587, "step": 4384 }, { "epoch": 0.81, "learning_rate": 1.7118926381840404e-05, "loss": 0.4435, "step": 4385 }, { "epoch": 0.81, "learning_rate": 1.7117523452576375e-05, "loss": 0.4556, "step": 4386 }, { "epoch": 0.81, "learning_rate": 1.7116120239336337e-05, "loss": 0.4627, "step": 4387 }, { "epoch": 0.81, "learning_rate": 1.7114716742176273e-05, "loss": 0.4377, "step": 4388 }, { "epoch": 0.81, "learning_rate": 1.7113312961152186e-05, "loss": 0.4726, "step": 4389 }, { "epoch": 0.81, "learning_rate": 1.7111908896320083e-05, "loss": 0.444, "step": 4390 }, { "epoch": 0.81, "learning_rate": 1.7110504547735982e-05, "loss": 0.4451, "step": 4391 }, { "epoch": 0.81, "learning_rate": 1.7109099915455912e-05, "loss": 0.4556, "step": 4392 }, { "epoch": 0.81, "learning_rate": 1.710769499953592e-05, "loss": 0.4685, "step": 4393 }, { "epoch": 0.81, "learning_rate": 1.7106289800032057e-05, "loss": 0.4506, "step": 4394 }, { "epoch": 0.81, "learning_rate": 1.710488431700039e-05, "loss": 0.4772, "step": 4395 }, { "epoch": 0.81, "learning_rate": 1.7103478550496988e-05, "loss": 0.4666, "step": 4396 }, { "epoch": 0.81, "learning_rate": 1.7102072500577946e-05, "loss": 0.4579, "step": 4397 }, { "epoch": 0.81, "learning_rate": 1.710066616729936e-05, "loss": 0.459, "step": 4398 }, { "epoch": 0.81, "learning_rate": 1.709925955071734e-05, "loss": 0.4448, "step": 4399 }, { "epoch": 0.81, "learning_rate": 1.709785265088801e-05, "loss": 0.4887, "step": 4400 }, { "epoch": 0.81, "learning_rate": 1.7096445467867503e-05, "loss": 0.4491, "step": 4401 }, { "epoch": 0.81, "learning_rate": 1.7095038001711954e-05, "loss": 0.467, "step": 4402 }, { "epoch": 0.81, "learning_rate": 1.7093630252477527e-05, "loss": 0.4615, "step": 4403 }, { "epoch": 0.81, "learning_rate": 1.7092222220220386e-05, "loss": 0.4408, "step": 4404 }, { "epoch": 0.81, "learning_rate": 1.7090813904996714e-05, "loss": 0.4322, "step": 4405 }, { "epoch": 0.82, "learning_rate": 1.708940530686269e-05, "loss": 0.4712, "step": 4406 }, { "epoch": 0.82, "learning_rate": 1.7087996425874524e-05, "loss": 0.461, "step": 4407 }, { "epoch": 0.82, "learning_rate": 1.7086587262088417e-05, "loss": 0.4397, "step": 4408 }, { "epoch": 0.82, "learning_rate": 1.7085177815560605e-05, "loss": 0.4543, "step": 4409 }, { "epoch": 0.82, "learning_rate": 1.7083768086347318e-05, "loss": 0.4368, "step": 4410 }, { "epoch": 0.82, "learning_rate": 1.7082358074504794e-05, "loss": 0.4688, "step": 4411 }, { "epoch": 0.82, "learning_rate": 1.7080947780089297e-05, "loss": 0.4311, "step": 4412 }, { "epoch": 0.82, "learning_rate": 1.7079537203157094e-05, "loss": 0.4598, "step": 4413 }, { "epoch": 0.82, "learning_rate": 1.7078126343764462e-05, "loss": 0.4665, "step": 4414 }, { "epoch": 0.82, "learning_rate": 1.7076715201967698e-05, "loss": 0.4662, "step": 4415 }, { "epoch": 0.82, "learning_rate": 1.70753037778231e-05, "loss": 0.4636, "step": 4416 }, { "epoch": 0.82, "learning_rate": 1.7073892071386975e-05, "loss": 0.4703, "step": 4417 }, { "epoch": 0.82, "learning_rate": 1.7072480082715656e-05, "loss": 0.4548, "step": 4418 }, { "epoch": 0.82, "learning_rate": 1.7071067811865477e-05, "loss": 0.4443, "step": 4419 }, { "epoch": 0.82, "learning_rate": 1.7069655258892785e-05, "loss": 0.462, "step": 4420 }, { "epoch": 0.82, "learning_rate": 1.7068242423853933e-05, "loss": 0.431, "step": 4421 }, { "epoch": 0.82, "learning_rate": 1.7066829306805298e-05, "loss": 0.4558, "step": 4422 }, { "epoch": 0.82, "learning_rate": 1.7065415907803257e-05, "loss": 0.4593, "step": 4423 }, { "epoch": 0.82, "learning_rate": 1.7064002226904202e-05, "loss": 0.4666, "step": 4424 }, { "epoch": 0.82, "learning_rate": 1.706258826416454e-05, "loss": 0.4545, "step": 4425 }, { "epoch": 0.82, "learning_rate": 1.706117401964068e-05, "loss": 0.4537, "step": 4426 }, { "epoch": 0.82, "learning_rate": 1.7059759493389048e-05, "loss": 0.4566, "step": 4427 }, { "epoch": 0.82, "learning_rate": 1.7058344685466088e-05, "loss": 0.4806, "step": 4428 }, { "epoch": 0.82, "learning_rate": 1.7056929595928236e-05, "loss": 0.4462, "step": 4429 }, { "epoch": 0.82, "learning_rate": 1.7055514224831965e-05, "loss": 0.442, "step": 4430 }, { "epoch": 0.82, "learning_rate": 1.7054098572233736e-05, "loss": 0.4668, "step": 4431 }, { "epoch": 0.82, "learning_rate": 1.7052682638190036e-05, "loss": 0.4684, "step": 4432 }, { "epoch": 0.82, "learning_rate": 1.7051266422757357e-05, "loss": 0.4692, "step": 4433 }, { "epoch": 0.82, "learning_rate": 1.70498499259922e-05, "loss": 0.4753, "step": 4434 }, { "epoch": 0.82, "learning_rate": 1.7048433147951087e-05, "loss": 0.4536, "step": 4435 }, { "epoch": 0.82, "learning_rate": 1.7047016088690538e-05, "loss": 0.4606, "step": 4436 }, { "epoch": 0.82, "learning_rate": 1.7045598748267096e-05, "loss": 0.487, "step": 4437 }, { "epoch": 0.82, "learning_rate": 1.7044181126737308e-05, "loss": 0.453, "step": 4438 }, { "epoch": 0.82, "learning_rate": 1.7042763224157733e-05, "loss": 0.4551, "step": 4439 }, { "epoch": 0.82, "learning_rate": 1.704134504058495e-05, "loss": 0.4413, "step": 4440 }, { "epoch": 0.82, "learning_rate": 1.703992657607553e-05, "loss": 0.4719, "step": 4441 }, { "epoch": 0.82, "learning_rate": 1.703850783068608e-05, "loss": 0.4883, "step": 4442 }, { "epoch": 0.82, "learning_rate": 1.7037088804473194e-05, "loss": 0.4618, "step": 4443 }, { "epoch": 0.82, "learning_rate": 1.7035669497493497e-05, "loss": 0.4412, "step": 4444 }, { "epoch": 0.82, "learning_rate": 1.7034249909803612e-05, "loss": 0.485, "step": 4445 }, { "epoch": 0.82, "learning_rate": 1.703283004146018e-05, "loss": 0.4663, "step": 4446 }, { "epoch": 0.82, "learning_rate": 1.703140989251985e-05, "loss": 0.4739, "step": 4447 }, { "epoch": 0.82, "learning_rate": 1.702998946303928e-05, "loss": 0.485, "step": 4448 }, { "epoch": 0.82, "learning_rate": 1.7028568753075147e-05, "loss": 0.4653, "step": 4449 }, { "epoch": 0.82, "learning_rate": 1.7027147762684136e-05, "loss": 0.4462, "step": 4450 }, { "epoch": 0.82, "learning_rate": 1.7025726491922942e-05, "loss": 0.448, "step": 4451 }, { "epoch": 0.82, "learning_rate": 1.7024304940848267e-05, "loss": 0.4612, "step": 4452 }, { "epoch": 0.82, "learning_rate": 1.7022883109516826e-05, "loss": 0.4793, "step": 4453 }, { "epoch": 0.82, "learning_rate": 1.7021460997985355e-05, "loss": 0.4868, "step": 4454 }, { "epoch": 0.82, "learning_rate": 1.7020038606310592e-05, "loss": 0.4404, "step": 4455 }, { "epoch": 0.82, "learning_rate": 1.7018615934549283e-05, "loss": 0.4546, "step": 4456 }, { "epoch": 0.82, "learning_rate": 1.701719298275819e-05, "loss": 0.4678, "step": 4457 }, { "epoch": 0.82, "learning_rate": 1.7015769750994094e-05, "loss": 0.4635, "step": 4458 }, { "epoch": 0.82, "learning_rate": 1.7014346239313774e-05, "loss": 0.4655, "step": 4459 }, { "epoch": 0.83, "learning_rate": 1.7012922447774025e-05, "loss": 0.4645, "step": 4460 }, { "epoch": 0.83, "learning_rate": 1.7011498376431653e-05, "loss": 0.4621, "step": 4461 }, { "epoch": 0.83, "learning_rate": 1.701007402534348e-05, "loss": 0.4666, "step": 4462 }, { "epoch": 0.83, "learning_rate": 1.7008649394566327e-05, "loss": 0.4405, "step": 4463 }, { "epoch": 0.83, "learning_rate": 1.7007224484157044e-05, "loss": 0.4468, "step": 4464 }, { "epoch": 0.83, "learning_rate": 1.7005799294172475e-05, "loss": 0.487, "step": 4465 }, { "epoch": 0.83, "learning_rate": 1.7004373824669487e-05, "loss": 0.4508, "step": 4466 }, { "epoch": 0.83, "learning_rate": 1.700294807570495e-05, "loss": 0.4812, "step": 4467 }, { "epoch": 0.83, "learning_rate": 1.7001522047335752e-05, "loss": 0.4582, "step": 4468 }, { "epoch": 0.83, "learning_rate": 1.7000095739618788e-05, "loss": 0.4668, "step": 4469 }, { "epoch": 0.83, "learning_rate": 1.6998669152610962e-05, "loss": 0.455, "step": 4470 }, { "epoch": 0.83, "learning_rate": 1.6997242286369197e-05, "loss": 0.4567, "step": 4471 }, { "epoch": 0.83, "learning_rate": 1.6995815140950418e-05, "loss": 0.4178, "step": 4472 }, { "epoch": 0.83, "learning_rate": 1.6994387716411565e-05, "loss": 0.4419, "step": 4473 }, { "epoch": 0.83, "learning_rate": 1.6992960012809597e-05, "loss": 0.4302, "step": 4474 }, { "epoch": 0.83, "learning_rate": 1.699153203020147e-05, "loss": 0.449, "step": 4475 }, { "epoch": 0.83, "learning_rate": 1.6990103768644158e-05, "loss": 0.4579, "step": 4476 }, { "epoch": 0.83, "learning_rate": 1.6988675228194647e-05, "loss": 0.4679, "step": 4477 }, { "epoch": 0.83, "learning_rate": 1.6987246408909934e-05, "loss": 0.4333, "step": 4478 }, { "epoch": 0.83, "learning_rate": 1.6985817310847027e-05, "loss": 0.457, "step": 4479 }, { "epoch": 0.83, "learning_rate": 1.698438793406294e-05, "loss": 0.4748, "step": 4480 }, { "epoch": 0.83, "learning_rate": 1.6982958278614708e-05, "loss": 0.4479, "step": 4481 }, { "epoch": 0.83, "learning_rate": 1.698152834455937e-05, "loss": 0.4664, "step": 4482 }, { "epoch": 0.83, "learning_rate": 1.698009813195398e-05, "loss": 0.4384, "step": 4483 }, { "epoch": 0.83, "learning_rate": 1.6978667640855594e-05, "loss": 0.4814, "step": 4484 }, { "epoch": 0.83, "learning_rate": 1.697723687132129e-05, "loss": 0.4383, "step": 4485 }, { "epoch": 0.83, "learning_rate": 1.6975805823408153e-05, "loss": 0.455, "step": 4486 }, { "epoch": 0.83, "learning_rate": 1.697437449717328e-05, "loss": 0.4528, "step": 4487 }, { "epoch": 0.83, "learning_rate": 1.6972942892673772e-05, "loss": 0.446, "step": 4488 }, { "epoch": 0.83, "learning_rate": 1.697151100996676e-05, "loss": 0.4747, "step": 4489 }, { "epoch": 0.83, "learning_rate": 1.6970078849109362e-05, "loss": 0.4667, "step": 4490 }, { "epoch": 0.83, "learning_rate": 1.696864641015872e-05, "loss": 0.4631, "step": 4491 }, { "epoch": 0.83, "learning_rate": 1.6967213693171996e-05, "loss": 0.4429, "step": 4492 }, { "epoch": 0.83, "learning_rate": 1.696578069820634e-05, "loss": 0.4591, "step": 4493 }, { "epoch": 0.83, "learning_rate": 1.6964347425318934e-05, "loss": 0.4539, "step": 4494 }, { "epoch": 0.83, "learning_rate": 1.6962913874566958e-05, "loss": 0.4503, "step": 4495 }, { "epoch": 0.83, "learning_rate": 1.6961480046007606e-05, "loss": 0.4625, "step": 4496 }, { "epoch": 0.83, "learning_rate": 1.6960045939698094e-05, "loss": 0.4663, "step": 4497 }, { "epoch": 0.83, "learning_rate": 1.6958611555695634e-05, "loss": 0.4567, "step": 4498 }, { "epoch": 0.83, "learning_rate": 1.695717689405746e-05, "loss": 0.4594, "step": 4499 }, { "epoch": 0.83, "learning_rate": 1.6955741954840804e-05, "loss": 0.4744, "step": 4500 }, { "epoch": 0.83, "learning_rate": 1.6954306738102922e-05, "loss": 0.4715, "step": 4501 }, { "epoch": 0.83, "learning_rate": 1.695287124390108e-05, "loss": 0.4406, "step": 4502 }, { "epoch": 0.83, "learning_rate": 1.6951435472292545e-05, "loss": 0.4459, "step": 4503 }, { "epoch": 0.83, "learning_rate": 1.6949999423334608e-05, "loss": 0.444, "step": 4504 }, { "epoch": 0.83, "learning_rate": 1.694856309708456e-05, "loss": 0.4416, "step": 4505 }, { "epoch": 0.83, "learning_rate": 1.694712649359971e-05, "loss": 0.4611, "step": 4506 }, { "epoch": 0.83, "learning_rate": 1.6945689612937373e-05, "loss": 0.4434, "step": 4507 }, { "epoch": 0.83, "learning_rate": 1.694425245515488e-05, "loss": 0.4368, "step": 4508 }, { "epoch": 0.83, "learning_rate": 1.6942815020309574e-05, "loss": 0.4535, "step": 4509 }, { "epoch": 0.83, "learning_rate": 1.6941377308458802e-05, "loss": 0.4745, "step": 4510 }, { "epoch": 0.83, "learning_rate": 1.6939939319659924e-05, "loss": 0.4625, "step": 4511 }, { "epoch": 0.83, "learning_rate": 1.693850105397032e-05, "loss": 0.4532, "step": 4512 }, { "epoch": 0.83, "learning_rate": 1.6937062511447367e-05, "loss": 0.4701, "step": 4513 }, { "epoch": 0.84, "learning_rate": 1.6935623692148467e-05, "loss": 0.4574, "step": 4514 }, { "epoch": 0.84, "learning_rate": 1.693418459613102e-05, "loss": 0.4481, "step": 4515 }, { "epoch": 0.84, "learning_rate": 1.6932745223452446e-05, "loss": 0.4561, "step": 4516 }, { "epoch": 0.84, "learning_rate": 1.6931305574170176e-05, "loss": 0.4617, "step": 4517 }, { "epoch": 0.84, "learning_rate": 1.6929865648341643e-05, "loss": 0.4644, "step": 4518 }, { "epoch": 0.84, "learning_rate": 1.6928425446024305e-05, "loss": 0.4656, "step": 4519 }, { "epoch": 0.84, "learning_rate": 1.6926984967275615e-05, "loss": 0.4477, "step": 4520 }, { "epoch": 0.84, "learning_rate": 1.6925544212153052e-05, "loss": 0.4677, "step": 4521 }, { "epoch": 0.84, "learning_rate": 1.69241031807141e-05, "loss": 0.4454, "step": 4522 }, { "epoch": 0.84, "learning_rate": 1.6922661873016245e-05, "loss": 0.4649, "step": 4523 }, { "epoch": 0.84, "learning_rate": 1.6921220289117e-05, "loss": 0.4668, "step": 4524 }, { "epoch": 0.84, "learning_rate": 1.691977842907388e-05, "loss": 0.4497, "step": 4525 }, { "epoch": 0.84, "learning_rate": 1.6918336292944416e-05, "loss": 0.4481, "step": 4526 }, { "epoch": 0.84, "learning_rate": 1.6916893880786138e-05, "loss": 0.4649, "step": 4527 }, { "epoch": 0.84, "learning_rate": 1.6915451192656604e-05, "loss": 0.4769, "step": 4528 }, { "epoch": 0.84, "learning_rate": 1.691400822861337e-05, "loss": 0.4547, "step": 4529 }, { "epoch": 0.84, "learning_rate": 1.6912564988714003e-05, "loss": 0.446, "step": 4530 }, { "epoch": 0.84, "learning_rate": 1.69111214730161e-05, "loss": 0.4637, "step": 4531 }, { "epoch": 0.84, "learning_rate": 1.690967768157724e-05, "loss": 0.4574, "step": 4532 }, { "epoch": 0.84, "learning_rate": 1.6908233614455036e-05, "loss": 0.454, "step": 4533 }, { "epoch": 0.84, "learning_rate": 1.6906789271707104e-05, "loss": 0.4605, "step": 4534 }, { "epoch": 0.84, "learning_rate": 1.690534465339106e-05, "loss": 0.4477, "step": 4535 }, { "epoch": 0.84, "learning_rate": 1.6903899759564554e-05, "loss": 0.4392, "step": 4536 }, { "epoch": 0.84, "learning_rate": 1.690245459028523e-05, "loss": 0.4762, "step": 4537 }, { "epoch": 0.84, "learning_rate": 1.6901009145610748e-05, "loss": 0.4646, "step": 4538 }, { "epoch": 0.84, "learning_rate": 1.6899563425598774e-05, "loss": 0.4647, "step": 4539 }, { "epoch": 0.84, "learning_rate": 1.6898117430306994e-05, "loss": 0.4567, "step": 4540 }, { "epoch": 0.84, "learning_rate": 1.6896671159793102e-05, "loss": 0.4498, "step": 4541 }, { "epoch": 0.84, "learning_rate": 1.68952246141148e-05, "loss": 0.4572, "step": 4542 }, { "epoch": 0.84, "learning_rate": 1.6893777793329803e-05, "loss": 0.4763, "step": 4543 }, { "epoch": 0.84, "learning_rate": 1.6892330697495836e-05, "loss": 0.4413, "step": 4544 }, { "epoch": 0.84, "learning_rate": 1.6890883326670634e-05, "loss": 0.4551, "step": 4545 }, { "epoch": 0.84, "learning_rate": 1.6889435680911945e-05, "loss": 0.4629, "step": 4546 }, { "epoch": 0.84, "learning_rate": 1.6887987760277525e-05, "loss": 0.4505, "step": 4547 }, { "epoch": 0.84, "learning_rate": 1.688653956482515e-05, "loss": 0.4692, "step": 4548 }, { "epoch": 0.84, "learning_rate": 1.6885091094612595e-05, "loss": 0.4764, "step": 4549 }, { "epoch": 0.84, "learning_rate": 1.688364234969765e-05, "loss": 0.458, "step": 4550 }, { "epoch": 0.84, "learning_rate": 1.6882193330138125e-05, "loss": 0.4488, "step": 4551 }, { "epoch": 0.84, "learning_rate": 1.6880744035991825e-05, "loss": 0.4655, "step": 4552 }, { "epoch": 0.84, "learning_rate": 1.6879294467316578e-05, "loss": 0.4543, "step": 4553 }, { "epoch": 0.84, "learning_rate": 1.687784462417022e-05, "loss": 0.4491, "step": 4554 }, { "epoch": 0.84, "learning_rate": 1.6876394506610592e-05, "loss": 0.4667, "step": 4555 }, { "epoch": 0.84, "learning_rate": 1.6874944114695556e-05, "loss": 0.4553, "step": 4556 }, { "epoch": 0.84, "learning_rate": 1.6873493448482978e-05, "loss": 0.4419, "step": 4557 }, { "epoch": 0.84, "learning_rate": 1.687204250803074e-05, "loss": 0.437, "step": 4558 }, { "epoch": 0.84, "learning_rate": 1.687059129339673e-05, "loss": 0.4592, "step": 4559 }, { "epoch": 0.84, "learning_rate": 1.6869139804638844e-05, "loss": 0.4464, "step": 4560 }, { "epoch": 0.84, "learning_rate": 1.6867688041815e-05, "loss": 0.4359, "step": 4561 }, { "epoch": 0.84, "learning_rate": 1.6866236004983115e-05, "loss": 0.4417, "step": 4562 }, { "epoch": 0.84, "learning_rate": 1.686478369420113e-05, "loss": 0.4485, "step": 4563 }, { "epoch": 0.84, "learning_rate": 1.686333110952698e-05, "loss": 0.4512, "step": 4564 }, { "epoch": 0.84, "learning_rate": 1.6861878251018632e-05, "loss": 0.4533, "step": 4565 }, { "epoch": 0.84, "learning_rate": 1.6860425118734047e-05, "loss": 0.4263, "step": 4566 }, { "epoch": 0.84, "learning_rate": 1.6858971712731194e-05, "loss": 0.4694, "step": 4567 }, { "epoch": 0.85, "learning_rate": 1.6857518033068073e-05, "loss": 0.4425, "step": 4568 }, { "epoch": 0.85, "learning_rate": 1.685606407980268e-05, "loss": 0.4513, "step": 4569 }, { "epoch": 0.85, "learning_rate": 1.685460985299302e-05, "loss": 0.4418, "step": 4570 }, { "epoch": 0.85, "learning_rate": 1.6853155352697123e-05, "loss": 0.4689, "step": 4571 }, { "epoch": 0.85, "learning_rate": 1.6851700578973017e-05, "loss": 0.4501, "step": 4572 }, { "epoch": 0.85, "learning_rate": 1.6850245531878737e-05, "loss": 0.4506, "step": 4573 }, { "epoch": 0.85, "learning_rate": 1.684879021147235e-05, "loss": 0.4452, "step": 4574 }, { "epoch": 0.85, "learning_rate": 1.6847334617811907e-05, "loss": 0.4477, "step": 4575 }, { "epoch": 0.85, "learning_rate": 1.684587875095549e-05, "loss": 0.4705, "step": 4576 }, { "epoch": 0.85, "learning_rate": 1.684442261096119e-05, "loss": 0.4417, "step": 4577 }, { "epoch": 0.85, "learning_rate": 1.68429661978871e-05, "loss": 0.4616, "step": 4578 }, { "epoch": 0.85, "learning_rate": 1.6841509511791326e-05, "loss": 0.4589, "step": 4579 }, { "epoch": 0.85, "learning_rate": 1.684005255273199e-05, "loss": 0.4533, "step": 4580 }, { "epoch": 0.85, "learning_rate": 1.6838595320767218e-05, "loss": 0.4702, "step": 4581 }, { "epoch": 0.85, "learning_rate": 1.683713781595516e-05, "loss": 0.4697, "step": 4582 }, { "epoch": 0.85, "learning_rate": 1.6835680038353958e-05, "loss": 0.4772, "step": 4583 }, { "epoch": 0.85, "learning_rate": 1.683422198802178e-05, "loss": 0.4762, "step": 4584 }, { "epoch": 0.85, "learning_rate": 1.6832763665016796e-05, "loss": 0.4583, "step": 4585 }, { "epoch": 0.85, "learning_rate": 1.6831305069397196e-05, "loss": 0.4323, "step": 4586 }, { "epoch": 0.85, "learning_rate": 1.6829846201221166e-05, "loss": 0.4345, "step": 4587 }, { "epoch": 0.85, "learning_rate": 1.6828387060546922e-05, "loss": 0.455, "step": 4588 }, { "epoch": 0.85, "learning_rate": 1.6826927647432673e-05, "loss": 0.47, "step": 4589 }, { "epoch": 0.85, "learning_rate": 1.6825467961936656e-05, "loss": 0.457, "step": 4590 }, { "epoch": 0.85, "learning_rate": 1.6824008004117097e-05, "loss": 0.4628, "step": 4591 }, { "epoch": 0.85, "learning_rate": 1.6822547774032262e-05, "loss": 0.4535, "step": 4592 }, { "epoch": 0.85, "learning_rate": 1.6821087271740396e-05, "loss": 0.4549, "step": 4593 }, { "epoch": 0.85, "learning_rate": 1.681962649729978e-05, "loss": 0.4631, "step": 4594 }, { "epoch": 0.85, "learning_rate": 1.681816545076869e-05, "loss": 0.4698, "step": 4595 }, { "epoch": 0.85, "learning_rate": 1.6816704132205423e-05, "loss": 0.4542, "step": 4596 }, { "epoch": 0.85, "learning_rate": 1.6815242541668282e-05, "loss": 0.461, "step": 4597 }, { "epoch": 0.85, "learning_rate": 1.6813780679215585e-05, "loss": 0.4555, "step": 4598 }, { "epoch": 0.85, "learning_rate": 1.681231854490565e-05, "loss": 0.4608, "step": 4599 }, { "epoch": 0.85, "learning_rate": 1.681085613879682e-05, "loss": 0.4248, "step": 4600 }, { "epoch": 0.85, "learning_rate": 1.6809393460947435e-05, "loss": 0.4436, "step": 4601 }, { "epoch": 0.85, "learning_rate": 1.6807930511415865e-05, "loss": 0.4495, "step": 4602 }, { "epoch": 0.85, "learning_rate": 1.680646729026047e-05, "loss": 0.4767, "step": 4603 }, { "epoch": 0.85, "learning_rate": 1.680500379753963e-05, "loss": 0.4732, "step": 4604 }, { "epoch": 0.85, "learning_rate": 1.680354003331174e-05, "loss": 0.4764, "step": 4605 }, { "epoch": 0.85, "learning_rate": 1.6802075997635196e-05, "loss": 0.4482, "step": 4606 }, { "epoch": 0.85, "learning_rate": 1.6800611690568415e-05, "loss": 0.4549, "step": 4607 }, { "epoch": 0.85, "learning_rate": 1.679914711216982e-05, "loss": 0.4683, "step": 4608 }, { "epoch": 0.85, "learning_rate": 1.6797682262497846e-05, "loss": 0.4523, "step": 4609 }, { "epoch": 0.85, "learning_rate": 1.679621714161093e-05, "loss": 0.4596, "step": 4610 }, { "epoch": 0.85, "learning_rate": 1.6794751749567532e-05, "loss": 0.4403, "step": 4611 }, { "epoch": 0.85, "learning_rate": 1.6793286086426125e-05, "loss": 0.4538, "step": 4612 }, { "epoch": 0.85, "learning_rate": 1.679182015224518e-05, "loss": 0.4595, "step": 4613 }, { "epoch": 0.85, "learning_rate": 1.679035394708318e-05, "loss": 0.4752, "step": 4614 }, { "epoch": 0.85, "learning_rate": 1.6788887470998632e-05, "loss": 0.4635, "step": 4615 }, { "epoch": 0.85, "learning_rate": 1.6787420724050044e-05, "loss": 0.4582, "step": 4616 }, { "epoch": 0.85, "learning_rate": 1.6785953706295936e-05, "loss": 0.4701, "step": 4617 }, { "epoch": 0.85, "learning_rate": 1.6784486417794837e-05, "loss": 0.4499, "step": 4618 }, { "epoch": 0.85, "learning_rate": 1.6783018858605292e-05, "loss": 0.447, "step": 4619 }, { "epoch": 0.85, "learning_rate": 1.6781551028785857e-05, "loss": 0.4552, "step": 4620 }, { "epoch": 0.85, "learning_rate": 1.6780082928395086e-05, "loss": 0.4481, "step": 4621 }, { "epoch": 0.86, "learning_rate": 1.6778614557491564e-05, "loss": 0.4587, "step": 4622 }, { "epoch": 0.86, "learning_rate": 1.6777145916133867e-05, "loss": 0.477, "step": 4623 }, { "epoch": 0.86, "learning_rate": 1.6775677004380597e-05, "loss": 0.4537, "step": 4624 }, { "epoch": 0.86, "learning_rate": 1.677420782229036e-05, "loss": 0.4689, "step": 4625 }, { "epoch": 0.86, "learning_rate": 1.6772738369921772e-05, "loss": 0.4546, "step": 4626 }, { "epoch": 0.86, "learning_rate": 1.6771268647333463e-05, "loss": 0.4477, "step": 4627 }, { "epoch": 0.86, "learning_rate": 1.6769798654584074e-05, "loss": 0.4619, "step": 4628 }, { "epoch": 0.86, "learning_rate": 1.676832839173225e-05, "loss": 0.4559, "step": 4629 }, { "epoch": 0.86, "learning_rate": 1.6766857858836652e-05, "loss": 0.4791, "step": 4630 }, { "epoch": 0.86, "learning_rate": 1.676538705595596e-05, "loss": 0.4816, "step": 4631 }, { "epoch": 0.86, "learning_rate": 1.6763915983148846e-05, "loss": 0.4636, "step": 4632 }, { "epoch": 0.86, "learning_rate": 1.6762444640474006e-05, "loss": 0.4719, "step": 4633 }, { "epoch": 0.86, "learning_rate": 1.676097302799015e-05, "loss": 0.4521, "step": 4634 }, { "epoch": 0.86, "learning_rate": 1.6759501145755987e-05, "loss": 0.4662, "step": 4635 }, { "epoch": 0.86, "learning_rate": 1.6758028993830243e-05, "loss": 0.4627, "step": 4636 }, { "epoch": 0.86, "learning_rate": 1.6756556572271652e-05, "loss": 0.4671, "step": 4637 }, { "epoch": 0.86, "learning_rate": 1.675508388113896e-05, "loss": 0.4689, "step": 4638 }, { "epoch": 0.86, "learning_rate": 1.6753610920490933e-05, "loss": 0.474, "step": 4639 }, { "epoch": 0.86, "learning_rate": 1.6752137690386333e-05, "loss": 0.4616, "step": 4640 }, { "epoch": 0.86, "learning_rate": 1.675066419088394e-05, "loss": 0.4722, "step": 4641 }, { "epoch": 0.86, "learning_rate": 1.6749190422042546e-05, "loss": 0.4372, "step": 4642 }, { "epoch": 0.86, "learning_rate": 1.674771638392095e-05, "loss": 0.4629, "step": 4643 }, { "epoch": 0.86, "learning_rate": 1.6746242076577962e-05, "loss": 0.4652, "step": 4644 }, { "epoch": 0.86, "learning_rate": 1.67447675000724e-05, "loss": 0.4622, "step": 4645 }, { "epoch": 0.86, "learning_rate": 1.674329265446311e-05, "loss": 0.4828, "step": 4646 }, { "epoch": 0.86, "learning_rate": 1.674181753980893e-05, "loss": 0.4616, "step": 4647 }, { "epoch": 0.86, "learning_rate": 1.6740342156168706e-05, "loss": 0.4481, "step": 4648 }, { "epoch": 0.86, "learning_rate": 1.673886650360131e-05, "loss": 0.4629, "step": 4649 }, { "epoch": 0.86, "learning_rate": 1.673739058216562e-05, "loss": 0.4532, "step": 4650 }, { "epoch": 0.86, "learning_rate": 1.6735914391920517e-05, "loss": 0.4581, "step": 4651 }, { "epoch": 0.86, "learning_rate": 1.6734437932924902e-05, "loss": 0.4553, "step": 4652 }, { "epoch": 0.86, "learning_rate": 1.6732961205237686e-05, "loss": 0.4668, "step": 4653 }, { "epoch": 0.86, "learning_rate": 1.673148420891778e-05, "loss": 0.4501, "step": 4654 }, { "epoch": 0.86, "learning_rate": 1.6730006944024116e-05, "loss": 0.4479, "step": 4655 }, { "epoch": 0.86, "learning_rate": 1.6728529410615637e-05, "loss": 0.4394, "step": 4656 }, { "epoch": 0.86, "learning_rate": 1.672705160875129e-05, "loss": 0.4569, "step": 4657 }, { "epoch": 0.86, "learning_rate": 1.672557353849004e-05, "loss": 0.4621, "step": 4658 }, { "epoch": 0.86, "learning_rate": 1.672409519989086e-05, "loss": 0.4389, "step": 4659 }, { "epoch": 0.86, "learning_rate": 1.6722616593012725e-05, "loss": 0.4667, "step": 4660 }, { "epoch": 0.86, "learning_rate": 1.6721137717914642e-05, "loss": 0.4618, "step": 4661 }, { "epoch": 0.86, "learning_rate": 1.6719658574655602e-05, "loss": 0.4678, "step": 4662 }, { "epoch": 0.86, "learning_rate": 1.671817916329463e-05, "loss": 0.4334, "step": 4663 }, { "epoch": 0.86, "learning_rate": 1.6716699483890745e-05, "loss": 0.4642, "step": 4664 }, { "epoch": 0.86, "learning_rate": 1.6715219536502985e-05, "loss": 0.4602, "step": 4665 }, { "epoch": 0.86, "learning_rate": 1.6713739321190403e-05, "loss": 0.4722, "step": 4666 }, { "epoch": 0.86, "learning_rate": 1.671225883801205e-05, "loss": 0.4453, "step": 4667 }, { "epoch": 0.86, "learning_rate": 1.6710778087026997e-05, "loss": 0.4497, "step": 4668 }, { "epoch": 0.86, "learning_rate": 1.670929706829432e-05, "loss": 0.4402, "step": 4669 }, { "epoch": 0.86, "learning_rate": 1.670781578187312e-05, "loss": 0.4362, "step": 4670 }, { "epoch": 0.86, "learning_rate": 1.670633422782248e-05, "loss": 0.4669, "step": 4671 }, { "epoch": 0.86, "learning_rate": 1.6704852406201526e-05, "loss": 0.4646, "step": 4672 }, { "epoch": 0.86, "learning_rate": 1.670337031706937e-05, "loss": 0.4654, "step": 4673 }, { "epoch": 0.86, "learning_rate": 1.6701887960485155e-05, "loss": 0.4303, "step": 4674 }, { "epoch": 0.86, "learning_rate": 1.6700405336508017e-05, "loss": 0.4684, "step": 4675 }, { "epoch": 0.87, "learning_rate": 1.6698922445197113e-05, "loss": 0.4733, "step": 4676 }, { "epoch": 0.87, "learning_rate": 1.66974392866116e-05, "loss": 0.4435, "step": 4677 }, { "epoch": 0.87, "learning_rate": 1.6695955860810668e-05, "loss": 0.4482, "step": 4678 }, { "epoch": 0.87, "learning_rate": 1.6694472167853488e-05, "loss": 0.4903, "step": 4679 }, { "epoch": 0.87, "learning_rate": 1.6692988207799264e-05, "loss": 0.448, "step": 4680 }, { "epoch": 0.87, "learning_rate": 1.6691503980707204e-05, "loss": 0.4718, "step": 4681 }, { "epoch": 0.87, "learning_rate": 1.669001948663652e-05, "loss": 0.4511, "step": 4682 }, { "epoch": 0.87, "learning_rate": 1.668853472564645e-05, "loss": 0.4411, "step": 4683 }, { "epoch": 0.87, "learning_rate": 1.6687049697796223e-05, "loss": 0.4528, "step": 4684 }, { "epoch": 0.87, "learning_rate": 1.66855644031451e-05, "loss": 0.4616, "step": 4685 }, { "epoch": 0.87, "learning_rate": 1.6684078841752332e-05, "loss": 0.457, "step": 4686 }, { "epoch": 0.87, "learning_rate": 1.6682593013677193e-05, "loss": 0.452, "step": 4687 }, { "epoch": 0.87, "learning_rate": 1.6681106918978965e-05, "loss": 0.4235, "step": 4688 }, { "epoch": 0.87, "learning_rate": 1.667962055771694e-05, "loss": 0.4533, "step": 4689 }, { "epoch": 0.87, "learning_rate": 1.6678133929950428e-05, "loss": 0.4627, "step": 4690 }, { "epoch": 0.87, "learning_rate": 1.667664703573873e-05, "loss": 0.4734, "step": 4691 }, { "epoch": 0.87, "learning_rate": 1.6675159875141177e-05, "loss": 0.4551, "step": 4692 }, { "epoch": 0.87, "learning_rate": 1.6673672448217106e-05, "loss": 0.4508, "step": 4693 }, { "epoch": 0.87, "learning_rate": 1.667218475502586e-05, "loss": 0.4828, "step": 4694 }, { "epoch": 0.87, "learning_rate": 1.6670696795626794e-05, "loss": 0.4777, "step": 4695 }, { "epoch": 0.87, "learning_rate": 1.6669208570079277e-05, "loss": 0.4584, "step": 4696 }, { "epoch": 0.87, "learning_rate": 1.6667720078442686e-05, "loss": 0.4457, "step": 4697 }, { "epoch": 0.87, "learning_rate": 1.666623132077641e-05, "loss": 0.4445, "step": 4698 }, { "epoch": 0.87, "learning_rate": 1.6664742297139844e-05, "loss": 0.4842, "step": 4699 }, { "epoch": 0.87, "learning_rate": 1.66632530075924e-05, "loss": 0.4573, "step": 4700 }, { "epoch": 0.87, "learning_rate": 1.6661763452193498e-05, "loss": 0.4416, "step": 4701 }, { "epoch": 0.87, "learning_rate": 1.666027363100257e-05, "loss": 0.4617, "step": 4702 }, { "epoch": 0.87, "learning_rate": 1.6658783544079055e-05, "loss": 0.4607, "step": 4703 }, { "epoch": 0.87, "learning_rate": 1.66572931914824e-05, "loss": 0.4709, "step": 4704 }, { "epoch": 0.87, "learning_rate": 1.665580257327208e-05, "loss": 0.4501, "step": 4705 }, { "epoch": 0.87, "learning_rate": 1.6654311689507558e-05, "loss": 0.4199, "step": 4706 }, { "epoch": 0.87, "learning_rate": 1.665282054024832e-05, "loss": 0.4563, "step": 4707 }, { "epoch": 0.87, "learning_rate": 1.6651329125553854e-05, "loss": 0.456, "step": 4708 }, { "epoch": 0.87, "learning_rate": 1.6649837445483676e-05, "loss": 0.4639, "step": 4709 }, { "epoch": 0.87, "learning_rate": 1.6648345500097293e-05, "loss": 0.4951, "step": 4710 }, { "epoch": 0.87, "learning_rate": 1.6646853289454238e-05, "loss": 0.44, "step": 4711 }, { "epoch": 0.87, "learning_rate": 1.664536081361404e-05, "loss": 0.4572, "step": 4712 }, { "epoch": 0.87, "learning_rate": 1.6643868072636247e-05, "loss": 0.4548, "step": 4713 }, { "epoch": 0.87, "learning_rate": 1.6642375066580422e-05, "loss": 0.4667, "step": 4714 }, { "epoch": 0.87, "learning_rate": 1.6640881795506127e-05, "loss": 0.4439, "step": 4715 }, { "epoch": 0.87, "learning_rate": 1.6639388259472947e-05, "loss": 0.4547, "step": 4716 }, { "epoch": 0.87, "learning_rate": 1.6637894458540465e-05, "loss": 0.4503, "step": 4717 }, { "epoch": 0.87, "learning_rate": 1.6636400392768285e-05, "loss": 0.4669, "step": 4718 }, { "epoch": 0.87, "learning_rate": 1.663490606221602e-05, "loss": 0.4684, "step": 4719 }, { "epoch": 0.87, "learning_rate": 1.6633411466943283e-05, "loss": 0.4452, "step": 4720 }, { "epoch": 0.87, "learning_rate": 1.6631916607009712e-05, "loss": 0.4507, "step": 4721 }, { "epoch": 0.87, "learning_rate": 1.6630421482474944e-05, "loss": 0.4598, "step": 4722 }, { "epoch": 0.87, "learning_rate": 1.6628926093398637e-05, "loss": 0.4426, "step": 4723 }, { "epoch": 0.87, "learning_rate": 1.6627430439840453e-05, "loss": 0.459, "step": 4724 }, { "epoch": 0.87, "learning_rate": 1.6625934521860064e-05, "loss": 0.4732, "step": 4725 }, { "epoch": 0.87, "learning_rate": 1.662443833951715e-05, "loss": 0.4647, "step": 4726 }, { "epoch": 0.87, "learning_rate": 1.6622941892871418e-05, "loss": 0.4597, "step": 4727 }, { "epoch": 0.87, "learning_rate": 1.6621445181982565e-05, "loss": 0.444, "step": 4728 }, { "epoch": 0.87, "learning_rate": 1.661994820691031e-05, "loss": 0.4673, "step": 4729 }, { "epoch": 0.88, "learning_rate": 1.6618450967714373e-05, "loss": 0.4153, "step": 4730 }, { "epoch": 0.88, "learning_rate": 1.66169534644545e-05, "loss": 0.4731, "step": 4731 }, { "epoch": 0.88, "learning_rate": 1.661545569719043e-05, "loss": 0.4553, "step": 4732 }, { "epoch": 0.88, "learning_rate": 1.661395766598193e-05, "loss": 0.4499, "step": 4733 }, { "epoch": 0.88, "learning_rate": 1.6612459370888763e-05, "loss": 0.4805, "step": 4734 }, { "epoch": 0.88, "learning_rate": 1.6610960811970714e-05, "loss": 0.4508, "step": 4735 }, { "epoch": 0.88, "learning_rate": 1.6609461989287564e-05, "loss": 0.4621, "step": 4736 }, { "epoch": 0.88, "learning_rate": 1.660796290289912e-05, "loss": 0.447, "step": 4737 }, { "epoch": 0.88, "learning_rate": 1.6606463552865187e-05, "loss": 0.4445, "step": 4738 }, { "epoch": 0.88, "learning_rate": 1.6604963939245596e-05, "loss": 0.4548, "step": 4739 }, { "epoch": 0.88, "learning_rate": 1.660346406210017e-05, "loss": 0.4461, "step": 4740 }, { "epoch": 0.88, "learning_rate": 1.660196392148875e-05, "loss": 0.4579, "step": 4741 }, { "epoch": 0.88, "learning_rate": 1.6600463517471195e-05, "loss": 0.4617, "step": 4742 }, { "epoch": 0.88, "learning_rate": 1.6598962850107366e-05, "loss": 0.4375, "step": 4743 }, { "epoch": 0.88, "learning_rate": 1.659746191945714e-05, "loss": 0.4453, "step": 4744 }, { "epoch": 0.88, "learning_rate": 1.6595960725580392e-05, "loss": 0.4594, "step": 4745 }, { "epoch": 0.88, "learning_rate": 1.659445926853703e-05, "loss": 0.4408, "step": 4746 }, { "epoch": 0.88, "learning_rate": 1.659295754838695e-05, "loss": 0.4804, "step": 4747 }, { "epoch": 0.88, "learning_rate": 1.6591455565190068e-05, "loss": 0.4647, "step": 4748 }, { "epoch": 0.88, "learning_rate": 1.6589953319006316e-05, "loss": 0.4574, "step": 4749 }, { "epoch": 0.88, "learning_rate": 1.6588450809895627e-05, "loss": 0.4531, "step": 4750 }, { "epoch": 0.88, "learning_rate": 1.6586948037917948e-05, "loss": 0.4572, "step": 4751 }, { "epoch": 0.88, "learning_rate": 1.6585445003133234e-05, "loss": 0.465, "step": 4752 }, { "epoch": 0.88, "learning_rate": 1.6583941705601462e-05, "loss": 0.4618, "step": 4753 }, { "epoch": 0.88, "learning_rate": 1.6582438145382604e-05, "loss": 0.4734, "step": 4754 }, { "epoch": 0.88, "learning_rate": 1.658093432253665e-05, "loss": 0.4662, "step": 4755 }, { "epoch": 0.88, "learning_rate": 1.6579430237123605e-05, "loss": 0.4462, "step": 4756 }, { "epoch": 0.88, "learning_rate": 1.6577925889203473e-05, "loss": 0.4484, "step": 4757 }, { "epoch": 0.88, "learning_rate": 1.6576421278836274e-05, "loss": 0.4609, "step": 4758 }, { "epoch": 0.88, "learning_rate": 1.6574916406082045e-05, "loss": 0.4473, "step": 4759 }, { "epoch": 0.88, "learning_rate": 1.6573411271000822e-05, "loss": 0.4842, "step": 4760 }, { "epoch": 0.88, "learning_rate": 1.6571905873652662e-05, "loss": 0.4808, "step": 4761 }, { "epoch": 0.88, "learning_rate": 1.6570400214097623e-05, "loss": 0.452, "step": 4762 }, { "epoch": 0.88, "learning_rate": 1.6568894292395784e-05, "loss": 0.4524, "step": 4763 }, { "epoch": 0.88, "learning_rate": 1.6567388108607222e-05, "loss": 0.4568, "step": 4764 }, { "epoch": 0.88, "learning_rate": 1.6565881662792034e-05, "loss": 0.4708, "step": 4765 }, { "epoch": 0.88, "learning_rate": 1.656437495501032e-05, "loss": 0.4622, "step": 4766 }, { "epoch": 0.88, "learning_rate": 1.6562867985322206e-05, "loss": 0.4521, "step": 4767 }, { "epoch": 0.88, "learning_rate": 1.6561360753787807e-05, "loss": 0.4642, "step": 4768 }, { "epoch": 0.88, "learning_rate": 1.655985326046726e-05, "loss": 0.4338, "step": 4769 }, { "epoch": 0.88, "learning_rate": 1.6558345505420718e-05, "loss": 0.4603, "step": 4770 }, { "epoch": 0.88, "learning_rate": 1.655683748870833e-05, "loss": 0.4491, "step": 4771 }, { "epoch": 0.88, "learning_rate": 1.6555329210390265e-05, "loss": 0.4738, "step": 4772 }, { "epoch": 0.88, "learning_rate": 1.6553820670526702e-05, "loss": 0.4838, "step": 4773 }, { "epoch": 0.88, "learning_rate": 1.6552311869177828e-05, "loss": 0.4532, "step": 4774 }, { "epoch": 0.88, "learning_rate": 1.6550802806403843e-05, "loss": 0.4528, "step": 4775 }, { "epoch": 0.88, "learning_rate": 1.6549293482264953e-05, "loss": 0.461, "step": 4776 }, { "epoch": 0.88, "learning_rate": 1.6547783896821382e-05, "loss": 0.4675, "step": 4777 }, { "epoch": 0.88, "learning_rate": 1.654627405013335e-05, "loss": 0.4444, "step": 4778 }, { "epoch": 0.88, "learning_rate": 1.6544763942261107e-05, "loss": 0.4434, "step": 4779 }, { "epoch": 0.88, "learning_rate": 1.6543253573264905e-05, "loss": 0.4767, "step": 4780 }, { "epoch": 0.88, "learning_rate": 1.6541742943204996e-05, "loss": 0.4647, "step": 4781 }, { "epoch": 0.88, "learning_rate": 1.6540232052141653e-05, "loss": 0.4524, "step": 4782 }, { "epoch": 0.88, "learning_rate": 1.653872090013516e-05, "loss": 0.4357, "step": 4783 }, { "epoch": 0.89, "learning_rate": 1.6537209487245812e-05, "loss": 0.4778, "step": 4784 }, { "epoch": 0.89, "learning_rate": 1.6535697813533906e-05, "loss": 0.4333, "step": 4785 }, { "epoch": 0.89, "learning_rate": 1.6534185879059762e-05, "loss": 0.4485, "step": 4786 }, { "epoch": 0.89, "learning_rate": 1.6532673683883696e-05, "loss": 0.4605, "step": 4787 }, { "epoch": 0.89, "learning_rate": 1.6531161228066045e-05, "loss": 0.4596, "step": 4788 }, { "epoch": 0.89, "learning_rate": 1.6529648511667155e-05, "loss": 0.4663, "step": 4789 }, { "epoch": 0.89, "learning_rate": 1.6528135534747378e-05, "loss": 0.4526, "step": 4790 }, { "epoch": 0.89, "learning_rate": 1.6526622297367076e-05, "loss": 0.4567, "step": 4791 }, { "epoch": 0.89, "learning_rate": 1.6525108799586635e-05, "loss": 0.4259, "step": 4792 }, { "epoch": 0.89, "learning_rate": 1.6523595041466425e-05, "loss": 0.4395, "step": 4793 }, { "epoch": 0.89, "learning_rate": 1.652208102306686e-05, "loss": 0.4587, "step": 4794 }, { "epoch": 0.89, "learning_rate": 1.652056674444833e-05, "loss": 0.4666, "step": 4795 }, { "epoch": 0.89, "learning_rate": 1.6519052205671263e-05, "loss": 0.4518, "step": 4796 }, { "epoch": 0.89, "learning_rate": 1.6517537406796084e-05, "loss": 0.4345, "step": 4797 }, { "epoch": 0.89, "learning_rate": 1.6516022347883227e-05, "loss": 0.4257, "step": 4798 }, { "epoch": 0.89, "learning_rate": 1.6514507028993143e-05, "loss": 0.4606, "step": 4799 }, { "epoch": 0.89, "learning_rate": 1.651299145018629e-05, "loss": 0.4807, "step": 4800 }, { "epoch": 0.89, "learning_rate": 1.651147561152314e-05, "loss": 0.4632, "step": 4801 }, { "epoch": 0.89, "learning_rate": 1.650995951306416e-05, "loss": 0.4342, "step": 4802 }, { "epoch": 0.89, "learning_rate": 1.6508443154869854e-05, "loss": 0.4729, "step": 4803 }, { "epoch": 0.89, "learning_rate": 1.650692653700072e-05, "loss": 0.4637, "step": 4804 }, { "epoch": 0.89, "learning_rate": 1.650540965951726e-05, "loss": 0.4451, "step": 4805 }, { "epoch": 0.89, "learning_rate": 1.6503892522479996e-05, "loss": 0.4567, "step": 4806 }, { "epoch": 0.89, "learning_rate": 1.6502375125949467e-05, "loss": 0.4338, "step": 4807 }, { "epoch": 0.89, "learning_rate": 1.6500857469986208e-05, "loss": 0.4533, "step": 4808 }, { "epoch": 0.89, "learning_rate": 1.6499339554650774e-05, "loss": 0.4642, "step": 4809 }, { "epoch": 0.89, "learning_rate": 1.649782138000372e-05, "loss": 0.4482, "step": 4810 }, { "epoch": 0.89, "learning_rate": 1.6496302946105626e-05, "loss": 0.458, "step": 4811 }, { "epoch": 0.89, "learning_rate": 1.6494784253017072e-05, "loss": 0.4707, "step": 4812 }, { "epoch": 0.89, "learning_rate": 1.6493265300798653e-05, "loss": 0.4586, "step": 4813 }, { "epoch": 0.89, "learning_rate": 1.6491746089510968e-05, "loss": 0.4404, "step": 4814 }, { "epoch": 0.89, "learning_rate": 1.649022661921463e-05, "loss": 0.4434, "step": 4815 }, { "epoch": 0.89, "learning_rate": 1.648870688997027e-05, "loss": 0.4585, "step": 4816 }, { "epoch": 0.89, "learning_rate": 1.6487186901838522e-05, "loss": 0.4629, "step": 4817 }, { "epoch": 0.89, "learning_rate": 1.6485666654880024e-05, "loss": 0.4461, "step": 4818 }, { "epoch": 0.89, "learning_rate": 1.6484146149155434e-05, "loss": 0.4492, "step": 4819 }, { "epoch": 0.89, "learning_rate": 1.6482625384725416e-05, "loss": 0.4519, "step": 4820 }, { "epoch": 0.89, "learning_rate": 1.648110436165065e-05, "loss": 0.4546, "step": 4821 }, { "epoch": 0.89, "learning_rate": 1.647958307999182e-05, "loss": 0.4587, "step": 4822 }, { "epoch": 0.89, "learning_rate": 1.647806153980962e-05, "loss": 0.4544, "step": 4823 }, { "epoch": 0.89, "learning_rate": 1.647653974116476e-05, "loss": 0.4476, "step": 4824 }, { "epoch": 0.89, "learning_rate": 1.6475017684117954e-05, "loss": 0.4518, "step": 4825 }, { "epoch": 0.89, "learning_rate": 1.647349536872993e-05, "loss": 0.4774, "step": 4826 }, { "epoch": 0.89, "learning_rate": 1.6471972795061426e-05, "loss": 0.4477, "step": 4827 }, { "epoch": 0.89, "learning_rate": 1.647044996317319e-05, "loss": 0.4598, "step": 4828 }, { "epoch": 0.89, "learning_rate": 1.6468926873125982e-05, "loss": 0.4817, "step": 4829 }, { "epoch": 0.89, "learning_rate": 1.646740352498057e-05, "loss": 0.4569, "step": 4830 }, { "epoch": 0.89, "learning_rate": 1.6465879918797726e-05, "loss": 0.4656, "step": 4831 }, { "epoch": 0.89, "learning_rate": 1.6464356054638247e-05, "loss": 0.4362, "step": 4832 }, { "epoch": 0.89, "learning_rate": 1.6462831932562932e-05, "loss": 0.4474, "step": 4833 }, { "epoch": 0.89, "learning_rate": 1.646130755263259e-05, "loss": 0.4438, "step": 4834 }, { "epoch": 0.89, "learning_rate": 1.6459782914908037e-05, "loss": 0.4351, "step": 4835 }, { "epoch": 0.89, "learning_rate": 1.6458258019450106e-05, "loss": 0.4772, "step": 4836 }, { "epoch": 0.89, "learning_rate": 1.6456732866319632e-05, "loss": 0.4574, "step": 4837 }, { "epoch": 0.9, "learning_rate": 1.6455207455577474e-05, "loss": 0.4465, "step": 4838 }, { "epoch": 0.9, "learning_rate": 1.6453681787284496e-05, "loss": 0.4446, "step": 4839 }, { "epoch": 0.9, "learning_rate": 1.6452155861501556e-05, "loss": 0.438, "step": 4840 }, { "epoch": 0.9, "learning_rate": 1.6450629678289548e-05, "loss": 0.4878, "step": 4841 }, { "epoch": 0.9, "learning_rate": 1.6449103237709354e-05, "loss": 0.4396, "step": 4842 }, { "epoch": 0.9, "learning_rate": 1.6447576539821882e-05, "loss": 0.4195, "step": 4843 }, { "epoch": 0.9, "learning_rate": 1.6446049584688045e-05, "loss": 0.4476, "step": 4844 }, { "epoch": 0.9, "learning_rate": 1.6444522372368767e-05, "loss": 0.4653, "step": 4845 }, { "epoch": 0.9, "learning_rate": 1.6442994902924977e-05, "loss": 0.4433, "step": 4846 }, { "epoch": 0.9, "learning_rate": 1.6441467176417615e-05, "loss": 0.4563, "step": 4847 }, { "epoch": 0.9, "learning_rate": 1.6439939192907642e-05, "loss": 0.4565, "step": 4848 }, { "epoch": 0.9, "learning_rate": 1.6438410952456015e-05, "loss": 0.4588, "step": 4849 }, { "epoch": 0.9, "learning_rate": 1.6436882455123714e-05, "loss": 0.4396, "step": 4850 }, { "epoch": 0.9, "learning_rate": 1.6435353700971724e-05, "loss": 0.4594, "step": 4851 }, { "epoch": 0.9, "learning_rate": 1.6433824690061033e-05, "loss": 0.4709, "step": 4852 }, { "epoch": 0.9, "learning_rate": 1.6432295422452646e-05, "loss": 0.4475, "step": 4853 }, { "epoch": 0.9, "learning_rate": 1.6430765898207584e-05, "loss": 0.4731, "step": 4854 }, { "epoch": 0.9, "learning_rate": 1.6429236117386868e-05, "loss": 0.4667, "step": 4855 }, { "epoch": 0.9, "learning_rate": 1.6427706080051534e-05, "loss": 0.4573, "step": 4856 }, { "epoch": 0.9, "learning_rate": 1.642617578626263e-05, "loss": 0.4688, "step": 4857 }, { "epoch": 0.9, "learning_rate": 1.6424645236081206e-05, "loss": 0.4534, "step": 4858 }, { "epoch": 0.9, "learning_rate": 1.6423114429568335e-05, "loss": 0.4693, "step": 4859 }, { "epoch": 0.9, "learning_rate": 1.642158336678509e-05, "loss": 0.4462, "step": 4860 }, { "epoch": 0.9, "learning_rate": 1.6420052047792558e-05, "loss": 0.4715, "step": 4861 }, { "epoch": 0.9, "learning_rate": 1.6418520472651835e-05, "loss": 0.4511, "step": 4862 }, { "epoch": 0.9, "learning_rate": 1.641698864142403e-05, "loss": 0.4544, "step": 4863 }, { "epoch": 0.9, "learning_rate": 1.6415456554170254e-05, "loss": 0.4461, "step": 4864 }, { "epoch": 0.9, "learning_rate": 1.6413924210951642e-05, "loss": 0.4383, "step": 4865 }, { "epoch": 0.9, "learning_rate": 1.6412391611829334e-05, "loss": 0.4679, "step": 4866 }, { "epoch": 0.9, "learning_rate": 1.6410858756864468e-05, "loss": 0.4491, "step": 4867 }, { "epoch": 0.9, "learning_rate": 1.6409325646118207e-05, "loss": 0.4639, "step": 4868 }, { "epoch": 0.9, "learning_rate": 1.6407792279651723e-05, "loss": 0.4834, "step": 4869 }, { "epoch": 0.9, "learning_rate": 1.6406258657526186e-05, "loss": 0.4508, "step": 4870 }, { "epoch": 0.9, "learning_rate": 1.640472477980279e-05, "loss": 0.4645, "step": 4871 }, { "epoch": 0.9, "learning_rate": 1.6403190646542737e-05, "loss": 0.4564, "step": 4872 }, { "epoch": 0.9, "learning_rate": 1.6401656257807233e-05, "loss": 0.4453, "step": 4873 }, { "epoch": 0.9, "learning_rate": 1.6400121613657494e-05, "loss": 0.4597, "step": 4874 }, { "epoch": 0.9, "learning_rate": 1.6398586714154753e-05, "loss": 0.4525, "step": 4875 }, { "epoch": 0.9, "learning_rate": 1.6397051559360245e-05, "loss": 0.4723, "step": 4876 }, { "epoch": 0.9, "learning_rate": 1.6395516149335225e-05, "loss": 0.458, "step": 4877 }, { "epoch": 0.9, "learning_rate": 1.6393980484140954e-05, "loss": 0.47, "step": 4878 }, { "epoch": 0.9, "learning_rate": 1.6392444563838702e-05, "loss": 0.4504, "step": 4879 }, { "epoch": 0.9, "learning_rate": 1.6390908388489745e-05, "loss": 0.4483, "step": 4880 }, { "epoch": 0.9, "learning_rate": 1.6389371958155372e-05, "loss": 0.4535, "step": 4881 }, { "epoch": 0.9, "learning_rate": 1.638783527289689e-05, "loss": 0.4563, "step": 4882 }, { "epoch": 0.9, "learning_rate": 1.6386298332775606e-05, "loss": 0.4715, "step": 4883 }, { "epoch": 0.9, "learning_rate": 1.6384761137852846e-05, "loss": 0.4547, "step": 4884 }, { "epoch": 0.9, "learning_rate": 1.638322368818994e-05, "loss": 0.4589, "step": 4885 }, { "epoch": 0.9, "learning_rate": 1.638168598384822e-05, "loss": 0.4416, "step": 4886 }, { "epoch": 0.9, "learning_rate": 1.6380148024889047e-05, "loss": 0.4537, "step": 4887 }, { "epoch": 0.9, "learning_rate": 1.637860981137378e-05, "loss": 0.4627, "step": 4888 }, { "epoch": 0.9, "learning_rate": 1.6377071343363792e-05, "loss": 0.4681, "step": 4889 }, { "epoch": 0.9, "learning_rate": 1.6375532620920467e-05, "loss": 0.4586, "step": 4890 }, { "epoch": 0.9, "learning_rate": 1.6373993644105192e-05, "loss": 0.4576, "step": 4891 }, { "epoch": 0.91, "learning_rate": 1.637245441297937e-05, "loss": 0.4579, "step": 4892 }, { "epoch": 0.91, "learning_rate": 1.6370914927604416e-05, "loss": 0.4697, "step": 4893 }, { "epoch": 0.91, "learning_rate": 1.6369375188041752e-05, "loss": 0.4529, "step": 4894 }, { "epoch": 0.91, "learning_rate": 1.6367835194352813e-05, "loss": 0.4663, "step": 4895 }, { "epoch": 0.91, "learning_rate": 1.6366294946599037e-05, "loss": 0.4509, "step": 4896 }, { "epoch": 0.91, "learning_rate": 1.636475444484188e-05, "loss": 0.4493, "step": 4897 }, { "epoch": 0.91, "learning_rate": 1.6363213689142802e-05, "loss": 0.4548, "step": 4898 }, { "epoch": 0.91, "learning_rate": 1.6361672679563285e-05, "loss": 0.4315, "step": 4899 }, { "epoch": 0.91, "learning_rate": 1.6360131416164805e-05, "loss": 0.4787, "step": 4900 }, { "epoch": 0.91, "learning_rate": 1.6358589899008853e-05, "loss": 0.4685, "step": 4901 }, { "epoch": 0.91, "learning_rate": 1.635704812815694e-05, "loss": 0.4569, "step": 4902 }, { "epoch": 0.91, "learning_rate": 1.6355506103670574e-05, "loss": 0.4477, "step": 4903 }, { "epoch": 0.91, "learning_rate": 1.6353963825611282e-05, "loss": 0.4614, "step": 4904 }, { "epoch": 0.91, "learning_rate": 1.63524212940406e-05, "loss": 0.4693, "step": 4905 }, { "epoch": 0.91, "learning_rate": 1.6350878509020068e-05, "loss": 0.4863, "step": 4906 }, { "epoch": 0.91, "learning_rate": 1.634933547061124e-05, "loss": 0.4624, "step": 4907 }, { "epoch": 0.91, "learning_rate": 1.6347792178875684e-05, "loss": 0.4682, "step": 4908 }, { "epoch": 0.91, "learning_rate": 1.634624863387497e-05, "loss": 0.4522, "step": 4909 }, { "epoch": 0.91, "learning_rate": 1.634470483567069e-05, "loss": 0.4607, "step": 4910 }, { "epoch": 0.91, "learning_rate": 1.634316078432443e-05, "loss": 0.4556, "step": 4911 }, { "epoch": 0.91, "learning_rate": 1.6341616479897802e-05, "loss": 0.4508, "step": 4912 }, { "epoch": 0.91, "learning_rate": 1.6340071922452416e-05, "loss": 0.4484, "step": 4913 }, { "epoch": 0.91, "learning_rate": 1.63385271120499e-05, "loss": 0.4411, "step": 4914 }, { "epoch": 0.91, "learning_rate": 1.6336982048751883e-05, "loss": 0.4581, "step": 4915 }, { "epoch": 0.91, "learning_rate": 1.6335436732620017e-05, "loss": 0.473, "step": 4916 }, { "epoch": 0.91, "learning_rate": 1.633389116371596e-05, "loss": 0.4366, "step": 4917 }, { "epoch": 0.91, "learning_rate": 1.6332345342101367e-05, "loss": 0.4637, "step": 4918 }, { "epoch": 0.91, "learning_rate": 1.633079926783792e-05, "loss": 0.4701, "step": 4919 }, { "epoch": 0.91, "learning_rate": 1.6329252940987304e-05, "loss": 0.436, "step": 4920 }, { "epoch": 0.91, "learning_rate": 1.6327706361611212e-05, "loss": 0.4413, "step": 4921 }, { "epoch": 0.91, "learning_rate": 1.6326159529771354e-05, "loss": 0.4289, "step": 4922 }, { "epoch": 0.91, "learning_rate": 1.6324612445529443e-05, "loss": 0.4449, "step": 4923 }, { "epoch": 0.91, "learning_rate": 1.6323065108947208e-05, "loss": 0.4716, "step": 4924 }, { "epoch": 0.91, "learning_rate": 1.6321517520086377e-05, "loss": 0.4664, "step": 4925 }, { "epoch": 0.91, "learning_rate": 1.6319969679008704e-05, "loss": 0.4344, "step": 4926 }, { "epoch": 0.91, "learning_rate": 1.631842158577594e-05, "loss": 0.4536, "step": 4927 }, { "epoch": 0.91, "learning_rate": 1.6316873240449854e-05, "loss": 0.4555, "step": 4928 }, { "epoch": 0.91, "learning_rate": 1.631532464309222e-05, "loss": 0.4419, "step": 4929 }, { "epoch": 0.91, "learning_rate": 1.6313775793764825e-05, "loss": 0.4692, "step": 4930 }, { "epoch": 0.91, "learning_rate": 1.6312226692529466e-05, "loss": 0.4716, "step": 4931 }, { "epoch": 0.91, "learning_rate": 1.6310677339447952e-05, "loss": 0.4489, "step": 4932 }, { "epoch": 0.91, "learning_rate": 1.6309127734582093e-05, "loss": 0.4737, "step": 4933 }, { "epoch": 0.91, "learning_rate": 1.630757787799372e-05, "loss": 0.4636, "step": 4934 }, { "epoch": 0.91, "learning_rate": 1.6306027769744667e-05, "loss": 0.4389, "step": 4935 }, { "epoch": 0.91, "learning_rate": 1.630447740989678e-05, "loss": 0.4902, "step": 4936 }, { "epoch": 0.91, "learning_rate": 1.630292679851192e-05, "loss": 0.4368, "step": 4937 }, { "epoch": 0.91, "learning_rate": 1.6301375935651948e-05, "loss": 0.4651, "step": 4938 }, { "epoch": 0.91, "learning_rate": 1.629982482137874e-05, "loss": 0.4772, "step": 4939 }, { "epoch": 0.91, "learning_rate": 1.6298273455754187e-05, "loss": 0.4563, "step": 4940 }, { "epoch": 0.91, "learning_rate": 1.6296721838840187e-05, "loss": 0.4556, "step": 4941 }, { "epoch": 0.91, "learning_rate": 1.6295169970698644e-05, "loss": 0.4419, "step": 4942 }, { "epoch": 0.91, "learning_rate": 1.629361785139147e-05, "loss": 0.453, "step": 4943 }, { "epoch": 0.91, "learning_rate": 1.62920654809806e-05, "loss": 0.4441, "step": 4944 }, { "epoch": 0.91, "learning_rate": 1.6290512859527963e-05, "loss": 0.4687, "step": 4945 }, { "epoch": 0.92, "learning_rate": 1.628895998709551e-05, "loss": 0.4289, "step": 4946 }, { "epoch": 0.92, "learning_rate": 1.62874068637452e-05, "loss": 0.4516, "step": 4947 }, { "epoch": 0.92, "learning_rate": 1.6285853489539e-05, "loss": 0.4506, "step": 4948 }, { "epoch": 0.92, "learning_rate": 1.628429986453888e-05, "loss": 0.4621, "step": 4949 }, { "epoch": 0.92, "learning_rate": 1.6282745988806827e-05, "loss": 0.4548, "step": 4950 }, { "epoch": 0.92, "learning_rate": 1.6281191862404845e-05, "loss": 0.4417, "step": 4951 }, { "epoch": 0.92, "learning_rate": 1.6279637485394934e-05, "loss": 0.458, "step": 4952 }, { "epoch": 0.92, "learning_rate": 1.6278082857839116e-05, "loss": 0.4557, "step": 4953 }, { "epoch": 0.92, "learning_rate": 1.627652797979942e-05, "loss": 0.4606, "step": 4954 }, { "epoch": 0.92, "learning_rate": 1.6274972851337873e-05, "loss": 0.46, "step": 4955 }, { "epoch": 0.92, "learning_rate": 1.6273417472516526e-05, "loss": 0.4489, "step": 4956 }, { "epoch": 0.92, "learning_rate": 1.627186184339744e-05, "loss": 0.4629, "step": 4957 }, { "epoch": 0.92, "learning_rate": 1.6270305964042678e-05, "loss": 0.4609, "step": 4958 }, { "epoch": 0.92, "learning_rate": 1.6268749834514315e-05, "loss": 0.4479, "step": 4959 }, { "epoch": 0.92, "learning_rate": 1.6267193454874443e-05, "loss": 0.4342, "step": 4960 }, { "epoch": 0.92, "learning_rate": 1.6265636825185153e-05, "loss": 0.4567, "step": 4961 }, { "epoch": 0.92, "learning_rate": 1.6264079945508555e-05, "loss": 0.4591, "step": 4962 }, { "epoch": 0.92, "learning_rate": 1.6262522815906762e-05, "loss": 0.4621, "step": 4963 }, { "epoch": 0.92, "learning_rate": 1.626096543644191e-05, "loss": 0.4583, "step": 4964 }, { "epoch": 0.92, "learning_rate": 1.6259407807176125e-05, "loss": 0.4647, "step": 4965 }, { "epoch": 0.92, "learning_rate": 1.6257849928171557e-05, "loss": 0.4768, "step": 4966 }, { "epoch": 0.92, "learning_rate": 1.625629179949036e-05, "loss": 0.4642, "step": 4967 }, { "epoch": 0.92, "learning_rate": 1.625473342119471e-05, "loss": 0.4579, "step": 4968 }, { "epoch": 0.92, "learning_rate": 1.6253174793346774e-05, "loss": 0.4639, "step": 4969 }, { "epoch": 0.92, "learning_rate": 1.625161591600874e-05, "loss": 0.4541, "step": 4970 }, { "epoch": 0.92, "learning_rate": 1.6250056789242808e-05, "loss": 0.4816, "step": 4971 }, { "epoch": 0.92, "learning_rate": 1.6248497413111183e-05, "loss": 0.4648, "step": 4972 }, { "epoch": 0.92, "learning_rate": 1.6246937787676076e-05, "loss": 0.4572, "step": 4973 }, { "epoch": 0.92, "learning_rate": 1.6245377912999716e-05, "loss": 0.4729, "step": 4974 }, { "epoch": 0.92, "learning_rate": 1.6243817789144346e-05, "loss": 0.4493, "step": 4975 }, { "epoch": 0.92, "learning_rate": 1.62422574161722e-05, "loss": 0.4517, "step": 4976 }, { "epoch": 0.92, "learning_rate": 1.6240696794145546e-05, "loss": 0.4554, "step": 4977 }, { "epoch": 0.92, "learning_rate": 1.623913592312664e-05, "loss": 0.4442, "step": 4978 }, { "epoch": 0.92, "learning_rate": 1.6237574803177766e-05, "loss": 0.4563, "step": 4979 }, { "epoch": 0.92, "learning_rate": 1.6236013434361203e-05, "loss": 0.454, "step": 4980 }, { "epoch": 0.92, "learning_rate": 1.623445181673925e-05, "loss": 0.4448, "step": 4981 }, { "epoch": 0.92, "learning_rate": 1.6232889950374214e-05, "loss": 0.4604, "step": 4982 }, { "epoch": 0.92, "learning_rate": 1.6231327835328404e-05, "loss": 0.4705, "step": 4983 }, { "epoch": 0.92, "learning_rate": 1.6229765471664157e-05, "loss": 0.4392, "step": 4984 }, { "epoch": 0.92, "learning_rate": 1.6228202859443796e-05, "loss": 0.4735, "step": 4985 }, { "epoch": 0.92, "learning_rate": 1.6226639998729675e-05, "loss": 0.4578, "step": 4986 }, { "epoch": 0.92, "learning_rate": 1.6225076889584145e-05, "loss": 0.451, "step": 4987 }, { "epoch": 0.92, "learning_rate": 1.6223513532069577e-05, "loss": 0.4589, "step": 4988 }, { "epoch": 0.92, "learning_rate": 1.6221949926248338e-05, "loss": 0.4697, "step": 4989 }, { "epoch": 0.92, "learning_rate": 1.6220386072182816e-05, "loss": 0.4523, "step": 4990 }, { "epoch": 0.92, "learning_rate": 1.6218821969935407e-05, "loss": 0.4479, "step": 4991 }, { "epoch": 0.92, "learning_rate": 1.6217257619568518e-05, "loss": 0.4536, "step": 4992 }, { "epoch": 0.92, "learning_rate": 1.6215693021144557e-05, "loss": 0.4308, "step": 4993 }, { "epoch": 0.92, "learning_rate": 1.6214128174725954e-05, "loss": 0.4715, "step": 4994 }, { "epoch": 0.92, "learning_rate": 1.621256308037514e-05, "loss": 0.4586, "step": 4995 }, { "epoch": 0.92, "learning_rate": 1.6210997738154566e-05, "loss": 0.4432, "step": 4996 }, { "epoch": 0.92, "learning_rate": 1.6209432148126677e-05, "loss": 0.4788, "step": 4997 }, { "epoch": 0.92, "learning_rate": 1.6207866310353947e-05, "loss": 0.4667, "step": 4998 }, { "epoch": 0.92, "learning_rate": 1.6206300224898843e-05, "loss": 0.4428, "step": 4999 }, { "epoch": 0.93, "learning_rate": 1.6204733891823847e-05, "loss": 0.4569, "step": 5000 }, { "epoch": 0.93, "learning_rate": 1.6203167311191456e-05, "loss": 0.4403, "step": 5001 }, { "epoch": 0.93, "learning_rate": 1.6201600483064178e-05, "loss": 0.457, "step": 5002 }, { "epoch": 0.93, "learning_rate": 1.620003340750452e-05, "loss": 0.4772, "step": 5003 }, { "epoch": 0.93, "learning_rate": 1.6198466084575014e-05, "loss": 0.4452, "step": 5004 }, { "epoch": 0.93, "learning_rate": 1.619689851433818e-05, "loss": 0.4538, "step": 5005 }, { "epoch": 0.93, "learning_rate": 1.6195330696856573e-05, "loss": 0.4715, "step": 5006 }, { "epoch": 0.93, "learning_rate": 1.619376263219274e-05, "loss": 0.462, "step": 5007 }, { "epoch": 0.93, "learning_rate": 1.6192194320409244e-05, "loss": 0.4479, "step": 5008 }, { "epoch": 0.93, "learning_rate": 1.619062576156866e-05, "loss": 0.4672, "step": 5009 }, { "epoch": 0.93, "learning_rate": 1.618905695573357e-05, "loss": 0.473, "step": 5010 }, { "epoch": 0.93, "learning_rate": 1.6187487902966566e-05, "loss": 0.4637, "step": 5011 }, { "epoch": 0.93, "learning_rate": 1.618591860333025e-05, "loss": 0.4539, "step": 5012 }, { "epoch": 0.93, "learning_rate": 1.618434905688724e-05, "loss": 0.4286, "step": 5013 }, { "epoch": 0.93, "learning_rate": 1.6182779263700147e-05, "loss": 0.4612, "step": 5014 }, { "epoch": 0.93, "learning_rate": 1.6181209223831612e-05, "loss": 0.4557, "step": 5015 }, { "epoch": 0.93, "learning_rate": 1.617963893734427e-05, "loss": 0.4616, "step": 5016 }, { "epoch": 0.93, "learning_rate": 1.617806840430078e-05, "loss": 0.4659, "step": 5017 }, { "epoch": 0.93, "learning_rate": 1.6176497624763792e-05, "loss": 0.4565, "step": 5018 }, { "epoch": 0.93, "learning_rate": 1.6174926598795987e-05, "loss": 0.4391, "step": 5019 }, { "epoch": 0.93, "learning_rate": 1.6173355326460044e-05, "loss": 0.4578, "step": 5020 }, { "epoch": 0.93, "learning_rate": 1.6171783807818656e-05, "loss": 0.4485, "step": 5021 }, { "epoch": 0.93, "learning_rate": 1.617021204293452e-05, "loss": 0.4467, "step": 5022 }, { "epoch": 0.93, "learning_rate": 1.6168640031870346e-05, "loss": 0.4795, "step": 5023 }, { "epoch": 0.93, "learning_rate": 1.6167067774688852e-05, "loss": 0.4381, "step": 5024 }, { "epoch": 0.93, "learning_rate": 1.6165495271452775e-05, "loss": 0.4594, "step": 5025 }, { "epoch": 0.93, "learning_rate": 1.616392252222485e-05, "loss": 0.468, "step": 5026 }, { "epoch": 0.93, "learning_rate": 1.6162349527067834e-05, "loss": 0.46, "step": 5027 }, { "epoch": 0.93, "learning_rate": 1.6160776286044474e-05, "loss": 0.4714, "step": 5028 }, { "epoch": 0.93, "learning_rate": 1.6159202799217553e-05, "loss": 0.449, "step": 5029 }, { "epoch": 0.93, "learning_rate": 1.615762906664984e-05, "loss": 0.461, "step": 5030 }, { "epoch": 0.93, "learning_rate": 1.615605508840413e-05, "loss": 0.4546, "step": 5031 }, { "epoch": 0.93, "learning_rate": 1.6154480864543217e-05, "loss": 0.4488, "step": 5032 }, { "epoch": 0.93, "learning_rate": 1.6152906395129915e-05, "loss": 0.4556, "step": 5033 }, { "epoch": 0.93, "learning_rate": 1.6151331680227037e-05, "loss": 0.4393, "step": 5034 }, { "epoch": 0.93, "learning_rate": 1.6149756719897417e-05, "loss": 0.4581, "step": 5035 }, { "epoch": 0.93, "learning_rate": 1.6148181514203884e-05, "loss": 0.453, "step": 5036 }, { "epoch": 0.93, "learning_rate": 1.6146606063209297e-05, "loss": 0.4504, "step": 5037 }, { "epoch": 0.93, "learning_rate": 1.6145030366976507e-05, "loss": 0.4515, "step": 5038 }, { "epoch": 0.93, "learning_rate": 1.614345442556838e-05, "loss": 0.4613, "step": 5039 }, { "epoch": 0.93, "learning_rate": 1.61418782390478e-05, "loss": 0.4666, "step": 5040 }, { "epoch": 0.93, "learning_rate": 1.614030180747765e-05, "loss": 0.4531, "step": 5041 }, { "epoch": 0.93, "learning_rate": 1.613872513092082e-05, "loss": 0.4534, "step": 5042 }, { "epoch": 0.93, "learning_rate": 1.613714820944023e-05, "loss": 0.4769, "step": 5043 }, { "epoch": 0.93, "learning_rate": 1.6135571043098784e-05, "loss": 0.4556, "step": 5044 }, { "epoch": 0.93, "learning_rate": 1.6133993631959416e-05, "loss": 0.4688, "step": 5045 }, { "epoch": 0.93, "learning_rate": 1.613241597608506e-05, "loss": 0.4764, "step": 5046 }, { "epoch": 0.93, "learning_rate": 1.6130838075538654e-05, "loss": 0.4648, "step": 5047 }, { "epoch": 0.93, "learning_rate": 1.6129259930383167e-05, "loss": 0.4538, "step": 5048 }, { "epoch": 0.93, "learning_rate": 1.6127681540681553e-05, "loss": 0.472, "step": 5049 }, { "epoch": 0.93, "learning_rate": 1.612610290649679e-05, "loss": 0.4696, "step": 5050 }, { "epoch": 0.93, "learning_rate": 1.6124524027891867e-05, "loss": 0.4694, "step": 5051 }, { "epoch": 0.93, "learning_rate": 1.612294490492977e-05, "loss": 0.4542, "step": 5052 }, { "epoch": 0.93, "learning_rate": 1.612136553767351e-05, "loss": 0.4509, "step": 5053 }, { "epoch": 0.94, "learning_rate": 1.61197859261861e-05, "loss": 0.4364, "step": 5054 }, { "epoch": 0.94, "learning_rate": 1.611820607053056e-05, "loss": 0.4742, "step": 5055 }, { "epoch": 0.94, "learning_rate": 1.6116625970769925e-05, "loss": 0.4451, "step": 5056 }, { "epoch": 0.94, "learning_rate": 1.611504562696724e-05, "loss": 0.4674, "step": 5057 }, { "epoch": 0.94, "learning_rate": 1.6113465039185555e-05, "loss": 0.4585, "step": 5058 }, { "epoch": 0.94, "learning_rate": 1.6111884207487934e-05, "loss": 0.4459, "step": 5059 }, { "epoch": 0.94, "learning_rate": 1.611030313193745e-05, "loss": 0.4562, "step": 5060 }, { "epoch": 0.94, "learning_rate": 1.610872181259718e-05, "loss": 0.4804, "step": 5061 }, { "epoch": 0.94, "learning_rate": 1.610714024953022e-05, "loss": 0.4638, "step": 5062 }, { "epoch": 0.94, "learning_rate": 1.6105558442799676e-05, "loss": 0.44, "step": 5063 }, { "epoch": 0.94, "learning_rate": 1.6103976392468652e-05, "loss": 0.4537, "step": 5064 }, { "epoch": 0.94, "learning_rate": 1.6102394098600273e-05, "loss": 0.4474, "step": 5065 }, { "epoch": 0.94, "learning_rate": 1.6100811561257668e-05, "loss": 0.463, "step": 5066 }, { "epoch": 0.94, "learning_rate": 1.6099228780503974e-05, "loss": 0.4714, "step": 5067 }, { "epoch": 0.94, "learning_rate": 1.6097645756402346e-05, "loss": 0.4642, "step": 5068 }, { "epoch": 0.94, "learning_rate": 1.609606248901594e-05, "loss": 0.4302, "step": 5069 }, { "epoch": 0.94, "learning_rate": 1.6094478978407926e-05, "loss": 0.4456, "step": 5070 }, { "epoch": 0.94, "learning_rate": 1.609289522464149e-05, "loss": 0.451, "step": 5071 }, { "epoch": 0.94, "learning_rate": 1.609131122777981e-05, "loss": 0.4697, "step": 5072 }, { "epoch": 0.94, "learning_rate": 1.608972698788609e-05, "loss": 0.4343, "step": 5073 }, { "epoch": 0.94, "learning_rate": 1.6088142505023538e-05, "loss": 0.4558, "step": 5074 }, { "epoch": 0.94, "learning_rate": 1.6086557779255375e-05, "loss": 0.4411, "step": 5075 }, { "epoch": 0.94, "learning_rate": 1.6084972810644825e-05, "loss": 0.4373, "step": 5076 }, { "epoch": 0.94, "learning_rate": 1.6083387599255123e-05, "loss": 0.4615, "step": 5077 }, { "epoch": 0.94, "learning_rate": 1.6081802145149522e-05, "loss": 0.4412, "step": 5078 }, { "epoch": 0.94, "learning_rate": 1.6080216448391276e-05, "loss": 0.4548, "step": 5079 }, { "epoch": 0.94, "learning_rate": 1.6078630509043644e-05, "loss": 0.4402, "step": 5080 }, { "epoch": 0.94, "learning_rate": 1.6077044327169917e-05, "loss": 0.446, "step": 5081 }, { "epoch": 0.94, "learning_rate": 1.607545790283337e-05, "loss": 0.4402, "step": 5082 }, { "epoch": 0.94, "learning_rate": 1.60738712360973e-05, "loss": 0.4414, "step": 5083 }, { "epoch": 0.94, "learning_rate": 1.6072284327025013e-05, "loss": 0.4388, "step": 5084 }, { "epoch": 0.94, "learning_rate": 1.6070697175679824e-05, "loss": 0.4526, "step": 5085 }, { "epoch": 0.94, "learning_rate": 1.606910978212506e-05, "loss": 0.4215, "step": 5086 }, { "epoch": 0.94, "learning_rate": 1.6067522146424053e-05, "loss": 0.4496, "step": 5087 }, { "epoch": 0.94, "learning_rate": 1.6065934268640143e-05, "loss": 0.4576, "step": 5088 }, { "epoch": 0.94, "learning_rate": 1.6064346148836686e-05, "loss": 0.4486, "step": 5089 }, { "epoch": 0.94, "learning_rate": 1.606275778707705e-05, "loss": 0.4715, "step": 5090 }, { "epoch": 0.94, "learning_rate": 1.6061169183424595e-05, "loss": 0.4531, "step": 5091 }, { "epoch": 0.94, "learning_rate": 1.6059580337942717e-05, "loss": 0.4572, "step": 5092 }, { "epoch": 0.94, "learning_rate": 1.6057991250694803e-05, "loss": 0.4518, "step": 5093 }, { "epoch": 0.94, "learning_rate": 1.6056401921744252e-05, "loss": 0.4592, "step": 5094 }, { "epoch": 0.94, "learning_rate": 1.605481235115448e-05, "loss": 0.4679, "step": 5095 }, { "epoch": 0.94, "learning_rate": 1.6053222538988902e-05, "loss": 0.461, "step": 5096 }, { "epoch": 0.94, "learning_rate": 1.6051632485310954e-05, "loss": 0.4614, "step": 5097 }, { "epoch": 0.94, "learning_rate": 1.6050042190184076e-05, "loss": 0.4446, "step": 5098 }, { "epoch": 0.94, "learning_rate": 1.6048451653671714e-05, "loss": 0.4556, "step": 5099 }, { "epoch": 0.94, "learning_rate": 1.604686087583733e-05, "loss": 0.448, "step": 5100 }, { "epoch": 0.94, "learning_rate": 1.604526985674439e-05, "loss": 0.4631, "step": 5101 }, { "epoch": 0.94, "learning_rate": 1.6043678596456376e-05, "loss": 0.442, "step": 5102 }, { "epoch": 0.94, "learning_rate": 1.604208709503678e-05, "loss": 0.4356, "step": 5103 }, { "epoch": 0.94, "learning_rate": 1.6040495352549092e-05, "loss": 0.4451, "step": 5104 }, { "epoch": 0.94, "learning_rate": 1.6038903369056824e-05, "loss": 0.442, "step": 5105 }, { "epoch": 0.94, "learning_rate": 1.603731114462349e-05, "loss": 0.4454, "step": 5106 }, { "epoch": 0.94, "learning_rate": 1.6035718679312623e-05, "loss": 0.4533, "step": 5107 }, { "epoch": 0.95, "learning_rate": 1.6034125973187752e-05, "loss": 0.4507, "step": 5108 }, { "epoch": 0.95, "learning_rate": 1.6032533026312428e-05, "loss": 0.4649, "step": 5109 }, { "epoch": 0.95, "learning_rate": 1.6030939838750204e-05, "loss": 0.4604, "step": 5110 }, { "epoch": 0.95, "learning_rate": 1.6029346410564647e-05, "loss": 0.4363, "step": 5111 }, { "epoch": 0.95, "learning_rate": 1.602775274181933e-05, "loss": 0.4536, "step": 5112 }, { "epoch": 0.95, "learning_rate": 1.6026158832577843e-05, "loss": 0.4563, "step": 5113 }, { "epoch": 0.95, "learning_rate": 1.6024564682903773e-05, "loss": 0.4549, "step": 5114 }, { "epoch": 0.95, "learning_rate": 1.602297029286073e-05, "loss": 0.4232, "step": 5115 }, { "epoch": 0.95, "learning_rate": 1.602137566251232e-05, "loss": 0.4922, "step": 5116 }, { "epoch": 0.95, "learning_rate": 1.6019780791922165e-05, "loss": 0.4369, "step": 5117 }, { "epoch": 0.95, "learning_rate": 1.6018185681153905e-05, "loss": 0.4598, "step": 5118 }, { "epoch": 0.95, "learning_rate": 1.601659033027118e-05, "loss": 0.4654, "step": 5119 }, { "epoch": 0.95, "learning_rate": 1.6014994739337643e-05, "loss": 0.4643, "step": 5120 }, { "epoch": 0.95, "learning_rate": 1.601339890841695e-05, "loss": 0.4617, "step": 5121 }, { "epoch": 0.95, "learning_rate": 1.6011802837572772e-05, "loss": 0.4395, "step": 5122 }, { "epoch": 0.95, "learning_rate": 1.6010206526868792e-05, "loss": 0.4519, "step": 5123 }, { "epoch": 0.95, "learning_rate": 1.60086099763687e-05, "loss": 0.4677, "step": 5124 }, { "epoch": 0.95, "learning_rate": 1.6007013186136195e-05, "loss": 0.4713, "step": 5125 }, { "epoch": 0.95, "learning_rate": 1.6005416156234988e-05, "loss": 0.4556, "step": 5126 }, { "epoch": 0.95, "learning_rate": 1.600381888672879e-05, "loss": 0.455, "step": 5127 }, { "epoch": 0.95, "learning_rate": 1.6002221377681334e-05, "loss": 0.4469, "step": 5128 }, { "epoch": 0.95, "learning_rate": 1.600062362915636e-05, "loss": 0.4684, "step": 5129 }, { "epoch": 0.95, "learning_rate": 1.5999025641217614e-05, "loss": 0.4255, "step": 5130 }, { "epoch": 0.95, "learning_rate": 1.5997427413928854e-05, "loss": 0.4483, "step": 5131 }, { "epoch": 0.95, "learning_rate": 1.599582894735384e-05, "loss": 0.4777, "step": 5132 }, { "epoch": 0.95, "learning_rate": 1.5994230241556353e-05, "loss": 0.425, "step": 5133 }, { "epoch": 0.95, "learning_rate": 1.5992631296600175e-05, "loss": 0.4568, "step": 5134 }, { "epoch": 0.95, "learning_rate": 1.599103211254911e-05, "loss": 0.469, "step": 5135 }, { "epoch": 0.95, "learning_rate": 1.598943268946695e-05, "loss": 0.4538, "step": 5136 }, { "epoch": 0.95, "learning_rate": 1.5987833027417518e-05, "loss": 0.45, "step": 5137 }, { "epoch": 0.95, "learning_rate": 1.5986233126464634e-05, "loss": 0.4493, "step": 5138 }, { "epoch": 0.95, "learning_rate": 1.598463298667213e-05, "loss": 0.4551, "step": 5139 }, { "epoch": 0.95, "learning_rate": 1.598303260810385e-05, "loss": 0.4452, "step": 5140 }, { "epoch": 0.95, "learning_rate": 1.5981431990823645e-05, "loss": 0.4462, "step": 5141 }, { "epoch": 0.95, "learning_rate": 1.597983113489538e-05, "loss": 0.4411, "step": 5142 }, { "epoch": 0.95, "learning_rate": 1.5978230040382924e-05, "loss": 0.4521, "step": 5143 }, { "epoch": 0.95, "learning_rate": 1.597662870735016e-05, "loss": 0.4757, "step": 5144 }, { "epoch": 0.95, "learning_rate": 1.597502713586097e-05, "loss": 0.4696, "step": 5145 }, { "epoch": 0.95, "learning_rate": 1.5973425325979265e-05, "loss": 0.4634, "step": 5146 }, { "epoch": 0.95, "learning_rate": 1.597182327776895e-05, "loss": 0.4442, "step": 5147 }, { "epoch": 0.95, "learning_rate": 1.5970220991293937e-05, "loss": 0.4487, "step": 5148 }, { "epoch": 0.95, "learning_rate": 1.5968618466618163e-05, "loss": 0.453, "step": 5149 }, { "epoch": 0.95, "learning_rate": 1.5967015703805564e-05, "loss": 0.4605, "step": 5150 }, { "epoch": 0.95, "learning_rate": 1.5965412702920084e-05, "loss": 0.4857, "step": 5151 }, { "epoch": 0.95, "learning_rate": 1.5963809464025685e-05, "loss": 0.4492, "step": 5152 }, { "epoch": 0.95, "learning_rate": 1.5962205987186327e-05, "loss": 0.4534, "step": 5153 }, { "epoch": 0.95, "learning_rate": 1.596060227246599e-05, "loss": 0.4652, "step": 5154 }, { "epoch": 0.95, "learning_rate": 1.5958998319928656e-05, "loss": 0.4472, "step": 5155 }, { "epoch": 0.95, "learning_rate": 1.5957394129638322e-05, "loss": 0.4501, "step": 5156 }, { "epoch": 0.95, "learning_rate": 1.5955789701658994e-05, "loss": 0.4305, "step": 5157 }, { "epoch": 0.95, "learning_rate": 1.5954185036054685e-05, "loss": 0.4468, "step": 5158 }, { "epoch": 0.95, "learning_rate": 1.5952580132889416e-05, "loss": 0.4484, "step": 5159 }, { "epoch": 0.95, "learning_rate": 1.595097499222722e-05, "loss": 0.4598, "step": 5160 }, { "epoch": 0.95, "learning_rate": 1.5949369614132137e-05, "loss": 0.4326, "step": 5161 }, { "epoch": 0.96, "learning_rate": 1.5947763998668225e-05, "loss": 0.4404, "step": 5162 }, { "epoch": 0.96, "learning_rate": 1.594615814589954e-05, "loss": 0.4418, "step": 5163 }, { "epoch": 0.96, "learning_rate": 1.5944552055890156e-05, "loss": 0.4464, "step": 5164 }, { "epoch": 0.96, "learning_rate": 1.5942945728704148e-05, "loss": 0.4477, "step": 5165 }, { "epoch": 0.96, "learning_rate": 1.594133916440561e-05, "loss": 0.4278, "step": 5166 }, { "epoch": 0.96, "learning_rate": 1.593973236305864e-05, "loss": 0.4395, "step": 5167 }, { "epoch": 0.96, "learning_rate": 1.5938125324727347e-05, "loss": 0.4643, "step": 5168 }, { "epoch": 0.96, "learning_rate": 1.5936518049475847e-05, "loss": 0.4426, "step": 5169 }, { "epoch": 0.96, "learning_rate": 1.5934910537368265e-05, "loss": 0.4424, "step": 5170 }, { "epoch": 0.96, "learning_rate": 1.5933302788468745e-05, "loss": 0.4526, "step": 5171 }, { "epoch": 0.96, "learning_rate": 1.5931694802841425e-05, "loss": 0.4226, "step": 5172 }, { "epoch": 0.96, "learning_rate": 1.5930086580550463e-05, "loss": 0.4778, "step": 5173 }, { "epoch": 0.96, "learning_rate": 1.5928478121660028e-05, "loss": 0.461, "step": 5174 }, { "epoch": 0.96, "learning_rate": 1.5926869426234298e-05, "loss": 0.4694, "step": 5175 }, { "epoch": 0.96, "learning_rate": 1.5925260494337446e-05, "loss": 0.4528, "step": 5176 }, { "epoch": 0.96, "learning_rate": 1.592365132603367e-05, "loss": 0.4399, "step": 5177 }, { "epoch": 0.96, "learning_rate": 1.5922041921387176e-05, "loss": 0.451, "step": 5178 }, { "epoch": 0.96, "learning_rate": 1.5920432280462172e-05, "loss": 0.444, "step": 5179 }, { "epoch": 0.96, "learning_rate": 1.591882240332288e-05, "loss": 0.4521, "step": 5180 }, { "epoch": 0.96, "learning_rate": 1.5917212290033534e-05, "loss": 0.4511, "step": 5181 }, { "epoch": 0.96, "learning_rate": 1.5915601940658372e-05, "loss": 0.461, "step": 5182 }, { "epoch": 0.96, "learning_rate": 1.5913991355261646e-05, "loss": 0.4605, "step": 5183 }, { "epoch": 0.96, "learning_rate": 1.5912380533907613e-05, "loss": 0.4543, "step": 5184 }, { "epoch": 0.96, "learning_rate": 1.591076947666055e-05, "loss": 0.4462, "step": 5185 }, { "epoch": 0.96, "learning_rate": 1.590915818358472e-05, "loss": 0.4489, "step": 5186 }, { "epoch": 0.96, "learning_rate": 1.5907546654744422e-05, "loss": 0.4632, "step": 5187 }, { "epoch": 0.96, "learning_rate": 1.5905934890203953e-05, "loss": 0.4528, "step": 5188 }, { "epoch": 0.96, "learning_rate": 1.590432289002761e-05, "loss": 0.4572, "step": 5189 }, { "epoch": 0.96, "learning_rate": 1.590271065427972e-05, "loss": 0.4561, "step": 5190 }, { "epoch": 0.96, "learning_rate": 1.5901098183024603e-05, "loss": 0.474, "step": 5191 }, { "epoch": 0.96, "learning_rate": 1.5899485476326594e-05, "loss": 0.4548, "step": 5192 }, { "epoch": 0.96, "learning_rate": 1.5897872534250035e-05, "loss": 0.4513, "step": 5193 }, { "epoch": 0.96, "learning_rate": 1.5896259356859284e-05, "loss": 0.4364, "step": 5194 }, { "epoch": 0.96, "learning_rate": 1.5894645944218697e-05, "loss": 0.4449, "step": 5195 }, { "epoch": 0.96, "learning_rate": 1.5893032296392657e-05, "loss": 0.4342, "step": 5196 }, { "epoch": 0.96, "learning_rate": 1.5891418413445534e-05, "loss": 0.449, "step": 5197 }, { "epoch": 0.96, "learning_rate": 1.5889804295441727e-05, "loss": 0.4542, "step": 5198 }, { "epoch": 0.96, "learning_rate": 1.588818994244563e-05, "loss": 0.4718, "step": 5199 }, { "epoch": 0.96, "learning_rate": 1.588657535452166e-05, "loss": 0.4388, "step": 5200 }, { "epoch": 0.96, "learning_rate": 1.5884960531734228e-05, "loss": 0.4583, "step": 5201 }, { "epoch": 0.96, "learning_rate": 1.588334547414777e-05, "loss": 0.4696, "step": 5202 }, { "epoch": 0.96, "learning_rate": 1.5881730181826718e-05, "loss": 0.4345, "step": 5203 }, { "epoch": 0.96, "learning_rate": 1.5880114654835522e-05, "loss": 0.4619, "step": 5204 }, { "epoch": 0.96, "learning_rate": 1.5878498893238637e-05, "loss": 0.4756, "step": 5205 }, { "epoch": 0.96, "learning_rate": 1.5876882897100534e-05, "loss": 0.4535, "step": 5206 }, { "epoch": 0.96, "learning_rate": 1.587526666648568e-05, "loss": 0.4517, "step": 5207 }, { "epoch": 0.96, "learning_rate": 1.5873650201458567e-05, "loss": 0.4465, "step": 5208 }, { "epoch": 0.96, "learning_rate": 1.5872033502083682e-05, "loss": 0.4606, "step": 5209 }, { "epoch": 0.96, "learning_rate": 1.5870416568425535e-05, "loss": 0.4598, "step": 5210 }, { "epoch": 0.96, "learning_rate": 1.5868799400548633e-05, "loss": 0.4675, "step": 5211 }, { "epoch": 0.96, "learning_rate": 1.5867181998517503e-05, "loss": 0.4621, "step": 5212 }, { "epoch": 0.96, "learning_rate": 1.5865564362396674e-05, "loss": 0.4328, "step": 5213 }, { "epoch": 0.96, "learning_rate": 1.5863946492250688e-05, "loss": 0.4465, "step": 5214 }, { "epoch": 0.96, "learning_rate": 1.5862328388144092e-05, "loss": 0.4342, "step": 5215 }, { "epoch": 0.97, "learning_rate": 1.5860710050141443e-05, "loss": 0.455, "step": 5216 }, { "epoch": 0.97, "learning_rate": 1.585909147830732e-05, "loss": 0.4681, "step": 5217 }, { "epoch": 0.97, "learning_rate": 1.5857472672706294e-05, "loss": 0.4577, "step": 5218 }, { "epoch": 0.97, "learning_rate": 1.585585363340295e-05, "loss": 0.4372, "step": 5219 }, { "epoch": 0.97, "learning_rate": 1.5854234360461892e-05, "loss": 0.4588, "step": 5220 }, { "epoch": 0.97, "learning_rate": 1.5852614853947717e-05, "loss": 0.4646, "step": 5221 }, { "epoch": 0.97, "learning_rate": 1.5850995113925048e-05, "loss": 0.4571, "step": 5222 }, { "epoch": 0.97, "learning_rate": 1.5849375140458506e-05, "loss": 0.4621, "step": 5223 }, { "epoch": 0.97, "learning_rate": 1.584775493361273e-05, "loss": 0.434, "step": 5224 }, { "epoch": 0.97, "learning_rate": 1.5846134493452356e-05, "loss": 0.4424, "step": 5225 }, { "epoch": 0.97, "learning_rate": 1.5844513820042035e-05, "loss": 0.4519, "step": 5226 }, { "epoch": 0.97, "learning_rate": 1.5842892913446438e-05, "loss": 0.442, "step": 5227 }, { "epoch": 0.97, "learning_rate": 1.5841271773730232e-05, "loss": 0.4627, "step": 5228 }, { "epoch": 0.97, "learning_rate": 1.5839650400958092e-05, "loss": 0.4643, "step": 5229 }, { "epoch": 0.97, "learning_rate": 1.583802879519472e-05, "loss": 0.448, "step": 5230 }, { "epoch": 0.97, "learning_rate": 1.5836406956504803e-05, "loss": 0.4512, "step": 5231 }, { "epoch": 0.97, "learning_rate": 1.5834784884953056e-05, "loss": 0.4407, "step": 5232 }, { "epoch": 0.97, "learning_rate": 1.5833162580604194e-05, "loss": 0.4678, "step": 5233 }, { "epoch": 0.97, "learning_rate": 1.5831540043522947e-05, "loss": 0.4554, "step": 5234 }, { "epoch": 0.97, "learning_rate": 1.5829917273774048e-05, "loss": 0.4755, "step": 5235 }, { "epoch": 0.97, "learning_rate": 1.582829427142224e-05, "loss": 0.441, "step": 5236 }, { "epoch": 0.97, "learning_rate": 1.5826671036532287e-05, "loss": 0.4353, "step": 5237 }, { "epoch": 0.97, "learning_rate": 1.5825047569168943e-05, "loss": 0.4518, "step": 5238 }, { "epoch": 0.97, "learning_rate": 1.5823423869396987e-05, "loss": 0.4262, "step": 5239 }, { "epoch": 0.97, "learning_rate": 1.5821799937281203e-05, "loss": 0.4606, "step": 5240 }, { "epoch": 0.97, "learning_rate": 1.582017577288638e-05, "loss": 0.466, "step": 5241 }, { "epoch": 0.97, "learning_rate": 1.5818551376277318e-05, "loss": 0.4477, "step": 5242 }, { "epoch": 0.97, "learning_rate": 1.581692674751883e-05, "loss": 0.4625, "step": 5243 }, { "epoch": 0.97, "learning_rate": 1.5815301886675733e-05, "loss": 0.4496, "step": 5244 }, { "epoch": 0.97, "learning_rate": 1.5813676793812856e-05, "loss": 0.4422, "step": 5245 }, { "epoch": 0.97, "learning_rate": 1.581205146899504e-05, "loss": 0.4478, "step": 5246 }, { "epoch": 0.97, "learning_rate": 1.5810425912287134e-05, "loss": 0.4376, "step": 5247 }, { "epoch": 0.97, "learning_rate": 1.5808800123753987e-05, "loss": 0.4501, "step": 5248 }, { "epoch": 0.97, "learning_rate": 1.5807174103460472e-05, "loss": 0.451, "step": 5249 }, { "epoch": 0.97, "learning_rate": 1.5805547851471463e-05, "loss": 0.4353, "step": 5250 }, { "epoch": 0.97, "learning_rate": 1.5803921367851844e-05, "loss": 0.4451, "step": 5251 }, { "epoch": 0.97, "learning_rate": 1.5802294652666502e-05, "loss": 0.4447, "step": 5252 }, { "epoch": 0.97, "learning_rate": 1.580066770598035e-05, "loss": 0.4542, "step": 5253 }, { "epoch": 0.97, "learning_rate": 1.57990405278583e-05, "loss": 0.4625, "step": 5254 }, { "epoch": 0.97, "learning_rate": 1.5797413118365266e-05, "loss": 0.4438, "step": 5255 }, { "epoch": 0.97, "learning_rate": 1.5795785477566182e-05, "loss": 0.4609, "step": 5256 }, { "epoch": 0.97, "learning_rate": 1.579415760552599e-05, "loss": 0.4572, "step": 5257 }, { "epoch": 0.97, "learning_rate": 1.5792529502309634e-05, "loss": 0.4726, "step": 5258 }, { "epoch": 0.97, "learning_rate": 1.5790901167982078e-05, "loss": 0.4429, "step": 5259 }, { "epoch": 0.97, "learning_rate": 1.5789272602608287e-05, "loss": 0.4348, "step": 5260 }, { "epoch": 0.97, "learning_rate": 1.5787643806253236e-05, "loss": 0.4555, "step": 5261 }, { "epoch": 0.97, "learning_rate": 1.5786014778981913e-05, "loss": 0.4687, "step": 5262 }, { "epoch": 0.97, "learning_rate": 1.5784385520859316e-05, "loss": 0.4509, "step": 5263 }, { "epoch": 0.97, "learning_rate": 1.5782756031950442e-05, "loss": 0.451, "step": 5264 }, { "epoch": 0.97, "learning_rate": 1.578112631232031e-05, "loss": 0.4579, "step": 5265 }, { "epoch": 0.97, "learning_rate": 1.5779496362033943e-05, "loss": 0.4601, "step": 5266 }, { "epoch": 0.97, "learning_rate": 1.5777866181156367e-05, "loss": 0.4547, "step": 5267 }, { "epoch": 0.97, "learning_rate": 1.577623576975263e-05, "loss": 0.4367, "step": 5268 }, { "epoch": 0.97, "learning_rate": 1.5774605127887786e-05, "loss": 0.4612, "step": 5269 }, { "epoch": 0.98, "learning_rate": 1.577297425562688e-05, "loss": 0.4491, "step": 5270 }, { "epoch": 0.98, "learning_rate": 1.5771343153034998e-05, "loss": 0.4557, "step": 5271 }, { "epoch": 0.98, "learning_rate": 1.5769711820177204e-05, "loss": 0.442, "step": 5272 }, { "epoch": 0.98, "learning_rate": 1.5768080257118594e-05, "loss": 0.4301, "step": 5273 }, { "epoch": 0.98, "learning_rate": 1.5766448463924258e-05, "loss": 0.451, "step": 5274 }, { "epoch": 0.98, "learning_rate": 1.5764816440659308e-05, "loss": 0.4262, "step": 5275 }, { "epoch": 0.98, "learning_rate": 1.5763184187388853e-05, "loss": 0.4558, "step": 5276 }, { "epoch": 0.98, "learning_rate": 1.5761551704178016e-05, "loss": 0.4565, "step": 5277 }, { "epoch": 0.98, "learning_rate": 1.5759918991091937e-05, "loss": 0.4259, "step": 5278 }, { "epoch": 0.98, "learning_rate": 1.5758286048195758e-05, "loss": 0.4482, "step": 5279 }, { "epoch": 0.98, "learning_rate": 1.575665287555462e-05, "loss": 0.4692, "step": 5280 }, { "epoch": 0.98, "learning_rate": 1.5755019473233695e-05, "loss": 0.462, "step": 5281 }, { "epoch": 0.98, "learning_rate": 1.5753385841298144e-05, "loss": 0.4418, "step": 5282 }, { "epoch": 0.98, "learning_rate": 1.575175197981315e-05, "loss": 0.4554, "step": 5283 }, { "epoch": 0.98, "learning_rate": 1.5750117888843906e-05, "loss": 0.4403, "step": 5284 }, { "epoch": 0.98, "learning_rate": 1.5748483568455605e-05, "loss": 0.4431, "step": 5285 }, { "epoch": 0.98, "learning_rate": 1.574684901871345e-05, "loss": 0.4661, "step": 5286 }, { "epoch": 0.98, "learning_rate": 1.5745214239682658e-05, "loss": 0.4322, "step": 5287 }, { "epoch": 0.98, "learning_rate": 1.5743579231428455e-05, "loss": 0.4553, "step": 5288 }, { "epoch": 0.98, "learning_rate": 1.5741943994016074e-05, "loss": 0.4385, "step": 5289 }, { "epoch": 0.98, "learning_rate": 1.5740308527510762e-05, "loss": 0.4537, "step": 5290 }, { "epoch": 0.98, "learning_rate": 1.5738672831977762e-05, "loss": 0.4657, "step": 5291 }, { "epoch": 0.98, "learning_rate": 1.5737036907482345e-05, "loss": 0.4559, "step": 5292 }, { "epoch": 0.98, "learning_rate": 1.573540075408978e-05, "loss": 0.4315, "step": 5293 }, { "epoch": 0.98, "learning_rate": 1.573376437186534e-05, "loss": 0.4411, "step": 5294 }, { "epoch": 0.98, "learning_rate": 1.5732127760874316e-05, "loss": 0.4684, "step": 5295 }, { "epoch": 0.98, "learning_rate": 1.573049092118201e-05, "loss": 0.4416, "step": 5296 }, { "epoch": 0.98, "learning_rate": 1.5728853852853723e-05, "loss": 0.4576, "step": 5297 }, { "epoch": 0.98, "learning_rate": 1.5727216555954776e-05, "loss": 0.4491, "step": 5298 }, { "epoch": 0.98, "learning_rate": 1.572557903055049e-05, "loss": 0.4596, "step": 5299 }, { "epoch": 0.98, "learning_rate": 1.57239412767062e-05, "loss": 0.4468, "step": 5300 }, { "epoch": 0.98, "learning_rate": 1.572230329448726e-05, "loss": 0.4695, "step": 5301 }, { "epoch": 0.98, "learning_rate": 1.5720665083959005e-05, "loss": 0.4575, "step": 5302 }, { "epoch": 0.98, "learning_rate": 1.5719026645186806e-05, "loss": 0.4457, "step": 5303 }, { "epoch": 0.98, "learning_rate": 1.571738797823603e-05, "loss": 0.4634, "step": 5304 }, { "epoch": 0.98, "learning_rate": 1.5715749083172066e-05, "loss": 0.4405, "step": 5305 }, { "epoch": 0.98, "learning_rate": 1.5714109960060292e-05, "loss": 0.4349, "step": 5306 }, { "epoch": 0.98, "learning_rate": 1.5712470608966105e-05, "loss": 0.4473, "step": 5307 }, { "epoch": 0.98, "learning_rate": 1.5710831029954924e-05, "loss": 0.4261, "step": 5308 }, { "epoch": 0.98, "learning_rate": 1.570919122309216e-05, "loss": 0.4308, "step": 5309 }, { "epoch": 0.98, "learning_rate": 1.570755118844323e-05, "loss": 0.4414, "step": 5310 }, { "epoch": 0.98, "learning_rate": 1.5705910926073575e-05, "loss": 0.4456, "step": 5311 }, { "epoch": 0.98, "learning_rate": 1.5704270436048644e-05, "loss": 0.4332, "step": 5312 }, { "epoch": 0.98, "learning_rate": 1.5702629718433878e-05, "loss": 0.452, "step": 5313 }, { "epoch": 0.98, "learning_rate": 1.5700988773294746e-05, "loss": 0.4452, "step": 5314 }, { "epoch": 0.98, "learning_rate": 1.569934760069672e-05, "loss": 0.4569, "step": 5315 }, { "epoch": 0.98, "learning_rate": 1.5697706200705274e-05, "loss": 0.4613, "step": 5316 }, { "epoch": 0.98, "learning_rate": 1.56960645733859e-05, "loss": 0.4332, "step": 5317 }, { "epoch": 0.98, "learning_rate": 1.56944227188041e-05, "loss": 0.4545, "step": 5318 }, { "epoch": 0.98, "learning_rate": 1.569278063702537e-05, "loss": 0.4558, "step": 5319 }, { "epoch": 0.98, "learning_rate": 1.5691138328115234e-05, "loss": 0.442, "step": 5320 }, { "epoch": 0.98, "learning_rate": 1.5689495792139218e-05, "loss": 0.4396, "step": 5321 }, { "epoch": 0.98, "learning_rate": 1.568785302916285e-05, "loss": 0.4618, "step": 5322 }, { "epoch": 0.98, "learning_rate": 1.5686210039251683e-05, "loss": 0.4494, "step": 5323 }, { "epoch": 0.99, "learning_rate": 1.5684566822471254e-05, "loss": 0.446, "step": 5324 }, { "epoch": 0.99, "learning_rate": 1.568292337888714e-05, "loss": 0.4366, "step": 5325 }, { "epoch": 0.99, "learning_rate": 1.5681279708564905e-05, "loss": 0.4596, "step": 5326 }, { "epoch": 0.99, "learning_rate": 1.5679635811570128e-05, "loss": 0.4297, "step": 5327 }, { "epoch": 0.99, "learning_rate": 1.5677991687968396e-05, "loss": 0.449, "step": 5328 }, { "epoch": 0.99, "learning_rate": 1.5676347337825308e-05, "loss": 0.4524, "step": 5329 }, { "epoch": 0.99, "learning_rate": 1.567470276120647e-05, "loss": 0.4608, "step": 5330 }, { "epoch": 0.99, "learning_rate": 1.56730579581775e-05, "loss": 0.4521, "step": 5331 }, { "epoch": 0.99, "learning_rate": 1.567141292880402e-05, "loss": 0.4502, "step": 5332 }, { "epoch": 0.99, "learning_rate": 1.5669767673151666e-05, "loss": 0.4395, "step": 5333 }, { "epoch": 0.99, "learning_rate": 1.5668122191286077e-05, "loss": 0.4479, "step": 5334 }, { "epoch": 0.99, "learning_rate": 1.5666476483272907e-05, "loss": 0.4241, "step": 5335 }, { "epoch": 0.99, "learning_rate": 1.5664830549177818e-05, "loss": 0.4548, "step": 5336 }, { "epoch": 0.99, "learning_rate": 1.5663184389066477e-05, "loss": 0.437, "step": 5337 }, { "epoch": 0.99, "learning_rate": 1.5661538003004564e-05, "loss": 0.4566, "step": 5338 }, { "epoch": 0.99, "learning_rate": 1.565989139105777e-05, "loss": 0.4692, "step": 5339 }, { "epoch": 0.99, "learning_rate": 1.5658244553291786e-05, "loss": 0.4658, "step": 5340 }, { "epoch": 0.99, "learning_rate": 1.565659748977232e-05, "loss": 0.447, "step": 5341 }, { "epoch": 0.99, "learning_rate": 1.5654950200565084e-05, "loss": 0.4439, "step": 5342 }, { "epoch": 0.99, "learning_rate": 1.565330268573581e-05, "loss": 0.4655, "step": 5343 }, { "epoch": 0.99, "learning_rate": 1.5651654945350222e-05, "loss": 0.4549, "step": 5344 }, { "epoch": 0.99, "learning_rate": 1.5650006979474067e-05, "loss": 0.45, "step": 5345 }, { "epoch": 0.99, "learning_rate": 1.5648358788173098e-05, "loss": 0.4497, "step": 5346 }, { "epoch": 0.99, "learning_rate": 1.5646710371513063e-05, "loss": 0.4613, "step": 5347 }, { "epoch": 0.99, "learning_rate": 1.5645061729559744e-05, "loss": 0.4432, "step": 5348 }, { "epoch": 0.99, "learning_rate": 1.5643412862378914e-05, "loss": 0.4601, "step": 5349 }, { "epoch": 0.99, "learning_rate": 1.5641763770036357e-05, "loss": 0.4441, "step": 5350 }, { "epoch": 0.99, "learning_rate": 1.564011445259787e-05, "loss": 0.4806, "step": 5351 }, { "epoch": 0.99, "learning_rate": 1.5638464910129263e-05, "loss": 0.4635, "step": 5352 }, { "epoch": 0.99, "learning_rate": 1.5636815142696344e-05, "loss": 0.4486, "step": 5353 }, { "epoch": 0.99, "learning_rate": 1.5635165150364936e-05, "loss": 0.4507, "step": 5354 }, { "epoch": 0.99, "learning_rate": 1.563351493320087e-05, "loss": 0.4484, "step": 5355 }, { "epoch": 0.99, "learning_rate": 1.5631864491269992e-05, "loss": 0.4621, "step": 5356 }, { "epoch": 0.99, "learning_rate": 1.5630213824638145e-05, "loss": 0.4444, "step": 5357 }, { "epoch": 0.99, "learning_rate": 1.5628562933371193e-05, "loss": 0.4602, "step": 5358 }, { "epoch": 0.99, "learning_rate": 1.5626911817535e-05, "loss": 0.4505, "step": 5359 }, { "epoch": 0.99, "learning_rate": 1.562526047719544e-05, "loss": 0.4429, "step": 5360 }, { "epoch": 0.99, "learning_rate": 1.5623608912418408e-05, "loss": 0.4437, "step": 5361 }, { "epoch": 0.99, "learning_rate": 1.562195712326979e-05, "loss": 0.4498, "step": 5362 }, { "epoch": 0.99, "learning_rate": 1.562030510981549e-05, "loss": 0.4448, "step": 5363 }, { "epoch": 0.99, "learning_rate": 1.561865287212142e-05, "loss": 0.4485, "step": 5364 }, { "epoch": 0.99, "learning_rate": 1.561700041025351e-05, "loss": 0.4643, "step": 5365 }, { "epoch": 0.99, "learning_rate": 1.5615347724277678e-05, "loss": 0.4371, "step": 5366 }, { "epoch": 0.99, "learning_rate": 1.5613694814259866e-05, "loss": 0.4616, "step": 5367 }, { "epoch": 0.99, "learning_rate": 1.561204168026603e-05, "loss": 0.4289, "step": 5368 }, { "epoch": 0.99, "learning_rate": 1.561038832236212e-05, "loss": 0.4486, "step": 5369 }, { "epoch": 0.99, "learning_rate": 1.56087347406141e-05, "loss": 0.4458, "step": 5370 }, { "epoch": 0.99, "learning_rate": 1.560708093508795e-05, "loss": 0.4722, "step": 5371 }, { "epoch": 0.99, "learning_rate": 1.5605426905849654e-05, "loss": 0.4504, "step": 5372 }, { "epoch": 0.99, "learning_rate": 1.5603772652965198e-05, "loss": 0.4647, "step": 5373 }, { "epoch": 0.99, "learning_rate": 1.5602118176500592e-05, "loss": 0.4484, "step": 5374 }, { "epoch": 0.99, "learning_rate": 1.5600463476521843e-05, "loss": 0.4541, "step": 5375 }, { "epoch": 0.99, "learning_rate": 1.559880855309497e-05, "loss": 0.4558, "step": 5376 }, { "epoch": 0.99, "learning_rate": 1.5597153406286e-05, "loss": 0.4667, "step": 5377 }, { "epoch": 1.0, "learning_rate": 1.5595498036160973e-05, "loss": 0.4678, "step": 5378 }, { "epoch": 1.0, "learning_rate": 1.5593842442785936e-05, "loss": 0.4465, "step": 5379 }, { "epoch": 1.0, "learning_rate": 1.559218662622694e-05, "loss": 0.441, "step": 5380 }, { "epoch": 1.0, "learning_rate": 1.559053058655005e-05, "loss": 0.47, "step": 5381 }, { "epoch": 1.0, "learning_rate": 1.558887432382134e-05, "loss": 0.4345, "step": 5382 }, { "epoch": 1.0, "learning_rate": 1.5587217838106896e-05, "loss": 0.4248, "step": 5383 }, { "epoch": 1.0, "learning_rate": 1.5585561129472803e-05, "loss": 0.463, "step": 5384 }, { "epoch": 1.0, "learning_rate": 1.5583904197985162e-05, "loss": 0.445, "step": 5385 }, { "epoch": 1.0, "learning_rate": 1.5582247043710078e-05, "loss": 0.4411, "step": 5386 }, { "epoch": 1.0, "learning_rate": 1.5580589666713678e-05, "loss": 0.4723, "step": 5387 }, { "epoch": 1.0, "learning_rate": 1.557893206706208e-05, "loss": 0.4554, "step": 5388 }, { "epoch": 1.0, "learning_rate": 1.5577274244821422e-05, "loss": 0.4619, "step": 5389 }, { "epoch": 1.0, "learning_rate": 1.557561620005785e-05, "loss": 0.4215, "step": 5390 }, { "epoch": 1.0, "learning_rate": 1.5573957932837513e-05, "loss": 0.446, "step": 5391 }, { "epoch": 1.0, "learning_rate": 1.5572299443226572e-05, "loss": 0.4716, "step": 5392 }, { "epoch": 1.0, "learning_rate": 1.5570640731291203e-05, "loss": 0.478, "step": 5393 }, { "epoch": 1.0, "learning_rate": 1.556898179709758e-05, "loss": 0.4435, "step": 5394 }, { "epoch": 1.0, "learning_rate": 1.5567322640711896e-05, "loss": 0.4464, "step": 5395 }, { "epoch": 1.0, "learning_rate": 1.5565663262200344e-05, "loss": 0.4395, "step": 5396 }, { "epoch": 1.0, "learning_rate": 1.5564003661629135e-05, "loss": 0.4459, "step": 5397 }, { "epoch": 1.0, "learning_rate": 1.556234383906448e-05, "loss": 0.4621, "step": 5398 }, { "epoch": 1.0, "learning_rate": 1.55606837945726e-05, "loss": 0.4632, "step": 5399 }, { "epoch": 1.0, "learning_rate": 1.5559023528219742e-05, "loss": 0.4547, "step": 5400 }, { "epoch": 1.0, "learning_rate": 1.555736304007213e-05, "loss": 0.4573, "step": 5401 }, { "epoch": 1.0, "learning_rate": 1.5555702330196024e-05, "loss": 0.4683, "step": 5402 }, { "epoch": 1.0, "learning_rate": 1.5554041398657682e-05, "loss": 0.4438, "step": 5403 }, { "epoch": 1.0, "learning_rate": 1.5552380245523368e-05, "loss": 0.4595, "step": 5404 }, { "epoch": 1.0, "learning_rate": 1.5550718870859367e-05, "loss": 0.4508, "step": 5405 }, { "epoch": 1.0, "learning_rate": 1.5549057274731957e-05, "loss": 0.4584, "step": 5406 }, { "epoch": 1.0, "learning_rate": 1.5547395457207435e-05, "loss": 0.444, "step": 5407 }, { "epoch": 1.0, "learning_rate": 1.5545733418352103e-05, "loss": 0.4685, "step": 5408 }, { "epoch": 1.0, "learning_rate": 1.554407115823228e-05, "loss": 0.4511, "step": 5409 }, { "epoch": 1.0, "learning_rate": 1.554240867691428e-05, "loss": 0.4639, "step": 5410 }, { "epoch": 1.0, "learning_rate": 1.5540745974464434e-05, "loss": 0.442, "step": 5411 }, { "epoch": 1.0, "learning_rate": 1.5539083050949088e-05, "loss": 0.4452, "step": 5412 }, { "epoch": 1.0, "learning_rate": 1.5537419906434575e-05, "loss": 0.4519, "step": 5413 }, { "epoch": 1.0, "learning_rate": 1.5535756540987266e-05, "loss": 0.4336, "step": 5414 }, { "epoch": 1.0, "learning_rate": 1.5534092954673517e-05, "loss": 0.4566, "step": 5415 }, { "epoch": 1.0, "learning_rate": 1.5532429147559712e-05, "loss": 0.463, "step": 5416 }, { "epoch": 1.0, "learning_rate": 1.5530765119712218e-05, "loss": 0.4747, "step": 5417 }, { "epoch": 1.0, "learning_rate": 1.552910087119744e-05, "loss": 0.4408, "step": 5418 }, { "epoch": 1.0, "learning_rate": 1.552743640208177e-05, "loss": 0.4721, "step": 5419 }, { "epoch": 1.0, "learning_rate": 1.5525771712431626e-05, "loss": 0.4377, "step": 5420 }, { "epoch": 1.0, "learning_rate": 1.5524106802313422e-05, "loss": 0.4633, "step": 5421 }, { "epoch": 1.0, "learning_rate": 1.5522441671793585e-05, "loss": 0.4638, "step": 5422 }, { "epoch": 1.0, "learning_rate": 1.5520776320938544e-05, "loss": 0.4276, "step": 5423 }, { "epoch": 1.0, "learning_rate": 1.5519110749814753e-05, "loss": 0.4557, "step": 5424 }, { "epoch": 1.0, "learning_rate": 1.551744495848866e-05, "loss": 0.443, "step": 5425 }, { "epoch": 1.0, "learning_rate": 1.551577894702673e-05, "loss": 0.432, "step": 5426 }, { "epoch": 1.0, "learning_rate": 1.5514112715495433e-05, "loss": 0.4589, "step": 5427 }, { "epoch": 1.0, "learning_rate": 1.5512446263961247e-05, "loss": 0.457, "step": 5428 }, { "epoch": 1.0, "learning_rate": 1.551077959249066e-05, "loss": 0.4439, "step": 5429 }, { "epoch": 1.0, "learning_rate": 1.550911270115017e-05, "loss": 0.4453, "step": 5430 }, { "epoch": 1.0, "learning_rate": 1.5507445590006285e-05, "loss": 0.4492, "step": 5431 }, { "epoch": 1.0, "learning_rate": 1.5505778259125515e-05, "loss": 0.458, "step": 5432 }, { "epoch": 1.01, "learning_rate": 1.5504110708574387e-05, "loss": 0.4551, "step": 5433 }, { "epoch": 1.01, "learning_rate": 1.5502442938419434e-05, "loss": 0.456, "step": 5434 }, { "epoch": 1.01, "learning_rate": 1.5500774948727192e-05, "loss": 0.4501, "step": 5435 }, { "epoch": 1.01, "learning_rate": 1.5499106739564217e-05, "loss": 0.4456, "step": 5436 }, { "epoch": 1.01, "learning_rate": 1.5497438310997063e-05, "loss": 0.474, "step": 5437 }, { "epoch": 1.01, "learning_rate": 1.5495769663092303e-05, "loss": 0.4287, "step": 5438 }, { "epoch": 1.01, "learning_rate": 1.5494100795916502e-05, "loss": 0.4387, "step": 5439 }, { "epoch": 1.01, "learning_rate": 1.5492431709536253e-05, "loss": 0.4543, "step": 5440 }, { "epoch": 1.01, "learning_rate": 1.5490762404018148e-05, "loss": 0.4504, "step": 5441 }, { "epoch": 1.01, "learning_rate": 1.548909287942879e-05, "loss": 0.4489, "step": 5442 }, { "epoch": 1.01, "learning_rate": 1.548742313583479e-05, "loss": 0.4437, "step": 5443 }, { "epoch": 1.01, "learning_rate": 1.5485753173302766e-05, "loss": 0.448, "step": 5444 }, { "epoch": 1.01, "learning_rate": 1.5484082991899346e-05, "loss": 0.441, "step": 5445 }, { "epoch": 1.01, "learning_rate": 1.548241259169117e-05, "loss": 0.4384, "step": 5446 }, { "epoch": 1.01, "learning_rate": 1.5480741972744876e-05, "loss": 0.4437, "step": 5447 }, { "epoch": 1.01, "learning_rate": 1.5479071135127132e-05, "loss": 0.4581, "step": 5448 }, { "epoch": 1.01, "learning_rate": 1.547740007890459e-05, "loss": 0.4519, "step": 5449 }, { "epoch": 1.01, "learning_rate": 1.5475728804143927e-05, "loss": 0.4548, "step": 5450 }, { "epoch": 1.01, "learning_rate": 1.5474057310911823e-05, "loss": 0.4335, "step": 5451 }, { "epoch": 1.01, "learning_rate": 1.5472385599274967e-05, "loss": 0.4595, "step": 5452 }, { "epoch": 1.01, "learning_rate": 1.5470713669300054e-05, "loss": 0.4566, "step": 5453 }, { "epoch": 1.01, "learning_rate": 1.54690415210538e-05, "loss": 0.4263, "step": 5454 }, { "epoch": 1.01, "learning_rate": 1.5467369154602912e-05, "loss": 0.446, "step": 5455 }, { "epoch": 1.01, "learning_rate": 1.546569657001412e-05, "loss": 0.4335, "step": 5456 }, { "epoch": 1.01, "learning_rate": 1.546402376735415e-05, "loss": 0.4312, "step": 5457 }, { "epoch": 1.01, "learning_rate": 1.546235074668975e-05, "loss": 0.4483, "step": 5458 }, { "epoch": 1.01, "learning_rate": 1.546067750808767e-05, "loss": 0.4523, "step": 5459 }, { "epoch": 1.01, "learning_rate": 1.5459004051614667e-05, "loss": 0.4651, "step": 5460 }, { "epoch": 1.01, "learning_rate": 1.545733037733751e-05, "loss": 0.4418, "step": 5461 }, { "epoch": 1.01, "learning_rate": 1.545565648532297e-05, "loss": 0.4431, "step": 5462 }, { "epoch": 1.01, "learning_rate": 1.5453982375637844e-05, "loss": 0.4688, "step": 5463 }, { "epoch": 1.01, "learning_rate": 1.5452308048348915e-05, "loss": 0.4442, "step": 5464 }, { "epoch": 1.01, "learning_rate": 1.545063350352299e-05, "loss": 0.4434, "step": 5465 }, { "epoch": 1.01, "learning_rate": 1.544895874122688e-05, "loss": 0.4467, "step": 5466 }, { "epoch": 1.01, "learning_rate": 1.5447283761527404e-05, "loss": 0.4439, "step": 5467 }, { "epoch": 1.01, "learning_rate": 1.5445608564491394e-05, "loss": 0.4571, "step": 5468 }, { "epoch": 1.01, "learning_rate": 1.544393315018568e-05, "loss": 0.4625, "step": 5469 }, { "epoch": 1.01, "learning_rate": 1.5442257518677117e-05, "loss": 0.4486, "step": 5470 }, { "epoch": 1.01, "learning_rate": 1.5440581670032556e-05, "loss": 0.4443, "step": 5471 }, { "epoch": 1.01, "learning_rate": 1.5438905604318854e-05, "loss": 0.4402, "step": 5472 }, { "epoch": 1.01, "learning_rate": 1.543722932160289e-05, "loss": 0.4276, "step": 5473 }, { "epoch": 1.01, "learning_rate": 1.5435552821951547e-05, "loss": 0.4531, "step": 5474 }, { "epoch": 1.01, "learning_rate": 1.5433876105431705e-05, "loss": 0.4441, "step": 5475 }, { "epoch": 1.01, "learning_rate": 1.5432199172110266e-05, "loss": 0.4689, "step": 5476 }, { "epoch": 1.01, "learning_rate": 1.543052202205414e-05, "loss": 0.432, "step": 5477 }, { "epoch": 1.01, "learning_rate": 1.5428844655330242e-05, "loss": 0.4377, "step": 5478 }, { "epoch": 1.01, "learning_rate": 1.542716707200549e-05, "loss": 0.4609, "step": 5479 }, { "epoch": 1.01, "learning_rate": 1.5425489272146824e-05, "loss": 0.4221, "step": 5480 }, { "epoch": 1.01, "learning_rate": 1.5423811255821175e-05, "loss": 0.4321, "step": 5481 }, { "epoch": 1.01, "learning_rate": 1.5422133023095505e-05, "loss": 0.4401, "step": 5482 }, { "epoch": 1.01, "learning_rate": 1.5420454574036763e-05, "loss": 0.4652, "step": 5483 }, { "epoch": 1.01, "learning_rate": 1.5418775908711922e-05, "loss": 0.4333, "step": 5484 }, { "epoch": 1.01, "learning_rate": 1.541709702718795e-05, "loss": 0.4584, "step": 5485 }, { "epoch": 1.01, "learning_rate": 1.5415417929531837e-05, "loss": 0.4451, "step": 5486 }, { "epoch": 1.02, "learning_rate": 1.5413738615810576e-05, "loss": 0.4546, "step": 5487 }, { "epoch": 1.02, "learning_rate": 1.541205908609117e-05, "loss": 0.4548, "step": 5488 }, { "epoch": 1.02, "learning_rate": 1.5410379340440624e-05, "loss": 0.439, "step": 5489 }, { "epoch": 1.02, "learning_rate": 1.540869937892596e-05, "loss": 0.4462, "step": 5490 }, { "epoch": 1.02, "learning_rate": 1.5407019201614203e-05, "loss": 0.4231, "step": 5491 }, { "epoch": 1.02, "learning_rate": 1.5405338808572393e-05, "loss": 0.4343, "step": 5492 }, { "epoch": 1.02, "learning_rate": 1.5403658199867573e-05, "loss": 0.4362, "step": 5493 }, { "epoch": 1.02, "learning_rate": 1.5401977375566795e-05, "loss": 0.4664, "step": 5494 }, { "epoch": 1.02, "learning_rate": 1.540029633573712e-05, "loss": 0.4407, "step": 5495 }, { "epoch": 1.02, "learning_rate": 1.539861508044562e-05, "loss": 0.44, "step": 5496 }, { "epoch": 1.02, "learning_rate": 1.539693360975937e-05, "loss": 0.4422, "step": 5497 }, { "epoch": 1.02, "learning_rate": 1.5395251923745466e-05, "loss": 0.4592, "step": 5498 }, { "epoch": 1.02, "learning_rate": 1.5393570022470997e-05, "loss": 0.4427, "step": 5499 }, { "epoch": 1.02, "learning_rate": 1.5391887906003075e-05, "loss": 0.44, "step": 5500 }, { "epoch": 1.02, "learning_rate": 1.53902055744088e-05, "loss": 0.4575, "step": 5501 }, { "epoch": 1.02, "learning_rate": 1.5388523027755308e-05, "loss": 0.4402, "step": 5502 }, { "epoch": 1.02, "learning_rate": 1.538684026610972e-05, "loss": 0.442, "step": 5503 }, { "epoch": 1.02, "learning_rate": 1.5385157289539184e-05, "loss": 0.4532, "step": 5504 }, { "epoch": 1.02, "learning_rate": 1.538347409811084e-05, "loss": 0.476, "step": 5505 }, { "epoch": 1.02, "learning_rate": 1.5381790691891848e-05, "loss": 0.4492, "step": 5506 }, { "epoch": 1.02, "learning_rate": 1.5380107070949368e-05, "loss": 0.4293, "step": 5507 }, { "epoch": 1.02, "learning_rate": 1.537842323535058e-05, "loss": 0.4497, "step": 5508 }, { "epoch": 1.02, "learning_rate": 1.537673918516266e-05, "loss": 0.4413, "step": 5509 }, { "epoch": 1.02, "learning_rate": 1.5375054920452806e-05, "loss": 0.4296, "step": 5510 }, { "epoch": 1.02, "learning_rate": 1.5373370441288206e-05, "loss": 0.4536, "step": 5511 }, { "epoch": 1.02, "learning_rate": 1.5371685747736077e-05, "loss": 0.4478, "step": 5512 }, { "epoch": 1.02, "learning_rate": 1.5370000839863634e-05, "loss": 0.4657, "step": 5513 }, { "epoch": 1.02, "learning_rate": 1.5368315717738095e-05, "loss": 0.4471, "step": 5514 }, { "epoch": 1.02, "learning_rate": 1.5366630381426703e-05, "loss": 0.434, "step": 5515 }, { "epoch": 1.02, "learning_rate": 1.5364944830996692e-05, "loss": 0.447, "step": 5516 }, { "epoch": 1.02, "learning_rate": 1.5363259066515316e-05, "loss": 0.4586, "step": 5517 }, { "epoch": 1.02, "learning_rate": 1.5361573088049832e-05, "loss": 0.4334, "step": 5518 }, { "epoch": 1.02, "learning_rate": 1.535988689566751e-05, "loss": 0.4543, "step": 5519 }, { "epoch": 1.02, "learning_rate": 1.5358200489435625e-05, "loss": 0.426, "step": 5520 }, { "epoch": 1.02, "learning_rate": 1.535651386942146e-05, "loss": 0.4275, "step": 5521 }, { "epoch": 1.02, "learning_rate": 1.535482703569231e-05, "loss": 0.4358, "step": 5522 }, { "epoch": 1.02, "learning_rate": 1.5353139988315472e-05, "loss": 0.4582, "step": 5523 }, { "epoch": 1.02, "learning_rate": 1.535145272735826e-05, "loss": 0.4409, "step": 5524 }, { "epoch": 1.02, "learning_rate": 1.5349765252887996e-05, "loss": 0.4313, "step": 5525 }, { "epoch": 1.02, "learning_rate": 1.5348077564972002e-05, "loss": 0.4453, "step": 5526 }, { "epoch": 1.02, "learning_rate": 1.5346389663677615e-05, "loss": 0.4433, "step": 5527 }, { "epoch": 1.02, "learning_rate": 1.5344701549072176e-05, "loss": 0.4217, "step": 5528 }, { "epoch": 1.02, "learning_rate": 1.534301322122304e-05, "loss": 0.4463, "step": 5529 }, { "epoch": 1.02, "learning_rate": 1.5341324680197574e-05, "loss": 0.448, "step": 5530 }, { "epoch": 1.02, "learning_rate": 1.5339635926063138e-05, "loss": 0.4471, "step": 5531 }, { "epoch": 1.02, "learning_rate": 1.533794695888712e-05, "loss": 0.4424, "step": 5532 }, { "epoch": 1.02, "learning_rate": 1.5336257778736897e-05, "loss": 0.4212, "step": 5533 }, { "epoch": 1.02, "learning_rate": 1.5334568385679867e-05, "loss": 0.4387, "step": 5534 }, { "epoch": 1.02, "learning_rate": 1.533287877978344e-05, "loss": 0.4595, "step": 5535 }, { "epoch": 1.02, "learning_rate": 1.533118896111502e-05, "loss": 0.4293, "step": 5536 }, { "epoch": 1.02, "learning_rate": 1.5329498929742032e-05, "loss": 0.4771, "step": 5537 }, { "epoch": 1.02, "learning_rate": 1.5327808685731905e-05, "loss": 0.4393, "step": 5538 }, { "epoch": 1.02, "learning_rate": 1.5326118229152073e-05, "loss": 0.4364, "step": 5539 }, { "epoch": 1.02, "learning_rate": 1.5324427560069985e-05, "loss": 0.4353, "step": 5540 }, { "epoch": 1.03, "learning_rate": 1.5322736678553097e-05, "loss": 0.4436, "step": 5541 }, { "epoch": 1.03, "learning_rate": 1.532104558466887e-05, "loss": 0.4442, "step": 5542 }, { "epoch": 1.03, "learning_rate": 1.5319354278484774e-05, "loss": 0.4504, "step": 5543 }, { "epoch": 1.03, "learning_rate": 1.531766276006829e-05, "loss": 0.4576, "step": 5544 }, { "epoch": 1.03, "learning_rate": 1.5315971029486912e-05, "loss": 0.4361, "step": 5545 }, { "epoch": 1.03, "learning_rate": 1.5314279086808127e-05, "loss": 0.4587, "step": 5546 }, { "epoch": 1.03, "learning_rate": 1.5312586932099448e-05, "loss": 0.4295, "step": 5547 }, { "epoch": 1.03, "learning_rate": 1.531089456542839e-05, "loss": 0.4451, "step": 5548 }, { "epoch": 1.03, "learning_rate": 1.5309201986862466e-05, "loss": 0.4568, "step": 5549 }, { "epoch": 1.03, "learning_rate": 1.5307509196469214e-05, "loss": 0.4598, "step": 5550 }, { "epoch": 1.03, "learning_rate": 1.5305816194316174e-05, "loss": 0.4498, "step": 5551 }, { "epoch": 1.03, "learning_rate": 1.5304122980470887e-05, "loss": 0.4359, "step": 5552 }, { "epoch": 1.03, "learning_rate": 1.5302429555000917e-05, "loss": 0.4665, "step": 5553 }, { "epoch": 1.03, "learning_rate": 1.5300735917973827e-05, "loss": 0.4602, "step": 5554 }, { "epoch": 1.03, "learning_rate": 1.529904206945718e-05, "loss": 0.4363, "step": 5555 }, { "epoch": 1.03, "learning_rate": 1.5297348009518575e-05, "loss": 0.4439, "step": 5556 }, { "epoch": 1.03, "learning_rate": 1.5295653738225587e-05, "loss": 0.4606, "step": 5557 }, { "epoch": 1.03, "learning_rate": 1.529395925564582e-05, "loss": 0.4479, "step": 5558 }, { "epoch": 1.03, "learning_rate": 1.529226456184688e-05, "loss": 0.459, "step": 5559 }, { "epoch": 1.03, "learning_rate": 1.5290569656896383e-05, "loss": 0.4678, "step": 5560 }, { "epoch": 1.03, "learning_rate": 1.5288874540861952e-05, "loss": 0.4345, "step": 5561 }, { "epoch": 1.03, "learning_rate": 1.5287179213811215e-05, "loss": 0.4726, "step": 5562 }, { "epoch": 1.03, "learning_rate": 1.5285483675811818e-05, "loss": 0.4321, "step": 5563 }, { "epoch": 1.03, "learning_rate": 1.528378792693141e-05, "loss": 0.4532, "step": 5564 }, { "epoch": 1.03, "learning_rate": 1.5282091967237645e-05, "loss": 0.4365, "step": 5565 }, { "epoch": 1.03, "learning_rate": 1.5280395796798195e-05, "loss": 0.4524, "step": 5566 }, { "epoch": 1.03, "learning_rate": 1.5278699415680725e-05, "loss": 0.4743, "step": 5567 }, { "epoch": 1.03, "learning_rate": 1.527700282395292e-05, "loss": 0.4417, "step": 5568 }, { "epoch": 1.03, "learning_rate": 1.5275306021682474e-05, "loss": 0.4506, "step": 5569 }, { "epoch": 1.03, "learning_rate": 1.5273609008937086e-05, "loss": 0.4238, "step": 5570 }, { "epoch": 1.03, "learning_rate": 1.527191178578446e-05, "loss": 0.425, "step": 5571 }, { "epoch": 1.03, "learning_rate": 1.5270214352292316e-05, "loss": 0.4349, "step": 5572 }, { "epoch": 1.03, "learning_rate": 1.5268516708528375e-05, "loss": 0.4578, "step": 5573 }, { "epoch": 1.03, "learning_rate": 1.5266818854560373e-05, "loss": 0.458, "step": 5574 }, { "epoch": 1.03, "learning_rate": 1.5265120790456054e-05, "loss": 0.4474, "step": 5575 }, { "epoch": 1.03, "learning_rate": 1.526342251628316e-05, "loss": 0.4199, "step": 5576 }, { "epoch": 1.03, "learning_rate": 1.526172403210945e-05, "loss": 0.4277, "step": 5577 }, { "epoch": 1.03, "learning_rate": 1.52600253380027e-05, "loss": 0.4597, "step": 5578 }, { "epoch": 1.03, "learning_rate": 1.525832643403067e-05, "loss": 0.4338, "step": 5579 }, { "epoch": 1.03, "learning_rate": 1.5256627320261154e-05, "loss": 0.4576, "step": 5580 }, { "epoch": 1.03, "learning_rate": 1.525492799676194e-05, "loss": 0.4506, "step": 5581 }, { "epoch": 1.03, "learning_rate": 1.525322846360083e-05, "loss": 0.4483, "step": 5582 }, { "epoch": 1.03, "learning_rate": 1.5251528720845627e-05, "loss": 0.4235, "step": 5583 }, { "epoch": 1.03, "learning_rate": 1.5249828768564153e-05, "loss": 0.4368, "step": 5584 }, { "epoch": 1.03, "learning_rate": 1.5248128606824231e-05, "loss": 0.4686, "step": 5585 }, { "epoch": 1.03, "learning_rate": 1.5246428235693696e-05, "loss": 0.4479, "step": 5586 }, { "epoch": 1.03, "learning_rate": 1.5244727655240384e-05, "loss": 0.4421, "step": 5587 }, { "epoch": 1.03, "learning_rate": 1.5243026865532151e-05, "loss": 0.4388, "step": 5588 }, { "epoch": 1.03, "learning_rate": 1.5241325866636853e-05, "loss": 0.4572, "step": 5589 }, { "epoch": 1.03, "learning_rate": 1.5239624658622357e-05, "loss": 0.447, "step": 5590 }, { "epoch": 1.03, "learning_rate": 1.5237923241556539e-05, "loss": 0.4531, "step": 5591 }, { "epoch": 1.03, "learning_rate": 1.5236221615507278e-05, "loss": 0.4552, "step": 5592 }, { "epoch": 1.03, "learning_rate": 1.5234519780542472e-05, "loss": 0.4391, "step": 5593 }, { "epoch": 1.03, "learning_rate": 1.5232817736730017e-05, "loss": 0.4567, "step": 5594 }, { "epoch": 1.04, "learning_rate": 1.5231115484137824e-05, "loss": 0.4412, "step": 5595 }, { "epoch": 1.04, "learning_rate": 1.5229413022833808e-05, "loss": 0.4619, "step": 5596 }, { "epoch": 1.04, "learning_rate": 1.5227710352885897e-05, "loss": 0.4372, "step": 5597 }, { "epoch": 1.04, "learning_rate": 1.5226007474362017e-05, "loss": 0.4433, "step": 5598 }, { "epoch": 1.04, "learning_rate": 1.5224304387330115e-05, "loss": 0.4481, "step": 5599 }, { "epoch": 1.04, "learning_rate": 1.5222601091858143e-05, "loss": 0.4364, "step": 5600 }, { "epoch": 1.04, "learning_rate": 1.5220897588014057e-05, "loss": 0.4287, "step": 5601 }, { "epoch": 1.04, "learning_rate": 1.521919387586582e-05, "loss": 0.4455, "step": 5602 }, { "epoch": 1.04, "learning_rate": 1.5217489955481414e-05, "loss": 0.4214, "step": 5603 }, { "epoch": 1.04, "learning_rate": 1.5215785826928817e-05, "loss": 0.4496, "step": 5604 }, { "epoch": 1.04, "learning_rate": 1.5214081490276023e-05, "loss": 0.4561, "step": 5605 }, { "epoch": 1.04, "learning_rate": 1.5212376945591029e-05, "loss": 0.4402, "step": 5606 }, { "epoch": 1.04, "learning_rate": 1.5210672192941847e-05, "loss": 0.4459, "step": 5607 }, { "epoch": 1.04, "learning_rate": 1.5208967232396494e-05, "loss": 0.4454, "step": 5608 }, { "epoch": 1.04, "learning_rate": 1.5207262064022989e-05, "loss": 0.4345, "step": 5609 }, { "epoch": 1.04, "learning_rate": 1.5205556687889372e-05, "loss": 0.4521, "step": 5610 }, { "epoch": 1.04, "learning_rate": 1.5203851104063679e-05, "loss": 0.4494, "step": 5611 }, { "epoch": 1.04, "learning_rate": 1.5202145312613961e-05, "loss": 0.435, "step": 5612 }, { "epoch": 1.04, "learning_rate": 1.5200439313608275e-05, "loss": 0.4556, "step": 5613 }, { "epoch": 1.04, "learning_rate": 1.5198733107114693e-05, "loss": 0.4499, "step": 5614 }, { "epoch": 1.04, "learning_rate": 1.5197026693201284e-05, "loss": 0.4466, "step": 5615 }, { "epoch": 1.04, "learning_rate": 1.5195320071936131e-05, "loss": 0.441, "step": 5616 }, { "epoch": 1.04, "learning_rate": 1.5193613243387325e-05, "loss": 0.4478, "step": 5617 }, { "epoch": 1.04, "learning_rate": 1.5191906207622969e-05, "loss": 0.455, "step": 5618 }, { "epoch": 1.04, "learning_rate": 1.5190198964711165e-05, "loss": 0.4479, "step": 5619 }, { "epoch": 1.04, "learning_rate": 1.5188491514720032e-05, "loss": 0.4605, "step": 5620 }, { "epoch": 1.04, "learning_rate": 1.5186783857717695e-05, "loss": 0.4632, "step": 5621 }, { "epoch": 1.04, "learning_rate": 1.5185075993772284e-05, "loss": 0.4432, "step": 5622 }, { "epoch": 1.04, "learning_rate": 1.5183367922951942e-05, "loss": 0.451, "step": 5623 }, { "epoch": 1.04, "learning_rate": 1.5181659645324818e-05, "loss": 0.4457, "step": 5624 }, { "epoch": 1.04, "learning_rate": 1.5179951160959065e-05, "loss": 0.428, "step": 5625 }, { "epoch": 1.04, "learning_rate": 1.5178242469922852e-05, "loss": 0.4464, "step": 5626 }, { "epoch": 1.04, "learning_rate": 1.5176533572284351e-05, "loss": 0.466, "step": 5627 }, { "epoch": 1.04, "learning_rate": 1.5174824468111747e-05, "loss": 0.458, "step": 5628 }, { "epoch": 1.04, "learning_rate": 1.5173115157473227e-05, "loss": 0.4606, "step": 5629 }, { "epoch": 1.04, "learning_rate": 1.5171405640436989e-05, "loss": 0.4622, "step": 5630 }, { "epoch": 1.04, "learning_rate": 1.5169695917071242e-05, "loss": 0.4427, "step": 5631 }, { "epoch": 1.04, "learning_rate": 1.5167985987444196e-05, "loss": 0.4309, "step": 5632 }, { "epoch": 1.04, "learning_rate": 1.516627585162408e-05, "loss": 0.4546, "step": 5633 }, { "epoch": 1.04, "learning_rate": 1.5164565509679121e-05, "loss": 0.4533, "step": 5634 }, { "epoch": 1.04, "learning_rate": 1.5162854961677562e-05, "loss": 0.4138, "step": 5635 }, { "epoch": 1.04, "learning_rate": 1.5161144207687649e-05, "loss": 0.459, "step": 5636 }, { "epoch": 1.04, "learning_rate": 1.5159433247777635e-05, "loss": 0.4502, "step": 5637 }, { "epoch": 1.04, "learning_rate": 1.5157722082015789e-05, "loss": 0.4555, "step": 5638 }, { "epoch": 1.04, "learning_rate": 1.5156010710470381e-05, "loss": 0.4408, "step": 5639 }, { "epoch": 1.04, "learning_rate": 1.515429913320969e-05, "loss": 0.4735, "step": 5640 }, { "epoch": 1.04, "learning_rate": 1.5152587350302008e-05, "loss": 0.4331, "step": 5641 }, { "epoch": 1.04, "learning_rate": 1.5150875361815632e-05, "loss": 0.4276, "step": 5642 }, { "epoch": 1.04, "learning_rate": 1.5149163167818863e-05, "loss": 0.4615, "step": 5643 }, { "epoch": 1.04, "learning_rate": 1.514745076838002e-05, "loss": 0.4472, "step": 5644 }, { "epoch": 1.04, "learning_rate": 1.5145738163567419e-05, "loss": 0.4464, "step": 5645 }, { "epoch": 1.04, "learning_rate": 1.5144025353449393e-05, "loss": 0.4363, "step": 5646 }, { "epoch": 1.04, "learning_rate": 1.514231233809428e-05, "loss": 0.4801, "step": 5647 }, { "epoch": 1.04, "learning_rate": 1.5140599117570425e-05, "loss": 0.4704, "step": 5648 }, { "epoch": 1.05, "learning_rate": 1.513888569194618e-05, "loss": 0.4251, "step": 5649 }, { "epoch": 1.05, "learning_rate": 1.5137172061289913e-05, "loss": 0.4421, "step": 5650 }, { "epoch": 1.05, "learning_rate": 1.5135458225669992e-05, "loss": 0.4411, "step": 5651 }, { "epoch": 1.05, "learning_rate": 1.5133744185154798e-05, "loss": 0.4515, "step": 5652 }, { "epoch": 1.05, "learning_rate": 1.5132029939812714e-05, "loss": 0.4496, "step": 5653 }, { "epoch": 1.05, "learning_rate": 1.5130315489712135e-05, "loss": 0.4618, "step": 5654 }, { "epoch": 1.05, "learning_rate": 1.5128600834921468e-05, "loss": 0.4303, "step": 5655 }, { "epoch": 1.05, "learning_rate": 1.5126885975509122e-05, "loss": 0.4581, "step": 5656 }, { "epoch": 1.05, "learning_rate": 1.512517091154352e-05, "loss": 0.4358, "step": 5657 }, { "epoch": 1.05, "learning_rate": 1.5123455643093087e-05, "loss": 0.4416, "step": 5658 }, { "epoch": 1.05, "learning_rate": 1.512174017022626e-05, "loss": 0.4537, "step": 5659 }, { "epoch": 1.05, "learning_rate": 1.5120024493011483e-05, "loss": 0.455, "step": 5660 }, { "epoch": 1.05, "learning_rate": 1.5118308611517206e-05, "loss": 0.4297, "step": 5661 }, { "epoch": 1.05, "learning_rate": 1.5116592525811892e-05, "loss": 0.4269, "step": 5662 }, { "epoch": 1.05, "learning_rate": 1.5114876235964012e-05, "loss": 0.4425, "step": 5663 }, { "epoch": 1.05, "learning_rate": 1.5113159742042039e-05, "loss": 0.4608, "step": 5664 }, { "epoch": 1.05, "learning_rate": 1.5111443044114458e-05, "loss": 0.4478, "step": 5665 }, { "epoch": 1.05, "learning_rate": 1.5109726142249763e-05, "loss": 0.4423, "step": 5666 }, { "epoch": 1.05, "learning_rate": 1.5108009036516457e-05, "loss": 0.4487, "step": 5667 }, { "epoch": 1.05, "learning_rate": 1.5106291726983044e-05, "loss": 0.4445, "step": 5668 }, { "epoch": 1.05, "learning_rate": 1.5104574213718049e-05, "loss": 0.4391, "step": 5669 }, { "epoch": 1.05, "learning_rate": 1.5102856496789992e-05, "loss": 0.4266, "step": 5670 }, { "epoch": 1.05, "learning_rate": 1.510113857626741e-05, "loss": 0.4596, "step": 5671 }, { "epoch": 1.05, "learning_rate": 1.5099420452218842e-05, "loss": 0.4621, "step": 5672 }, { "epoch": 1.05, "learning_rate": 1.5097702124712838e-05, "loss": 0.4335, "step": 5673 }, { "epoch": 1.05, "learning_rate": 1.509598359381796e-05, "loss": 0.4377, "step": 5674 }, { "epoch": 1.05, "learning_rate": 1.5094264859602773e-05, "loss": 0.4541, "step": 5675 }, { "epoch": 1.05, "learning_rate": 1.5092545922135847e-05, "loss": 0.443, "step": 5676 }, { "epoch": 1.05, "learning_rate": 1.5090826781485766e-05, "loss": 0.4367, "step": 5677 }, { "epoch": 1.05, "learning_rate": 1.5089107437721121e-05, "loss": 0.4391, "step": 5678 }, { "epoch": 1.05, "learning_rate": 1.5087387890910516e-05, "loss": 0.4392, "step": 5679 }, { "epoch": 1.05, "learning_rate": 1.5085668141122551e-05, "loss": 0.4461, "step": 5680 }, { "epoch": 1.05, "learning_rate": 1.5083948188425846e-05, "loss": 0.4512, "step": 5681 }, { "epoch": 1.05, "learning_rate": 1.5082228032889016e-05, "loss": 0.4516, "step": 5682 }, { "epoch": 1.05, "learning_rate": 1.50805076745807e-05, "loss": 0.4543, "step": 5683 }, { "epoch": 1.05, "learning_rate": 1.5078787113569534e-05, "loss": 0.4448, "step": 5684 }, { "epoch": 1.05, "learning_rate": 1.5077066349924166e-05, "loss": 0.4481, "step": 5685 }, { "epoch": 1.05, "learning_rate": 1.5075345383713246e-05, "loss": 0.4407, "step": 5686 }, { "epoch": 1.05, "learning_rate": 1.5073624215005448e-05, "loss": 0.4544, "step": 5687 }, { "epoch": 1.05, "learning_rate": 1.5071902843869433e-05, "loss": 0.4473, "step": 5688 }, { "epoch": 1.05, "learning_rate": 1.5070181270373887e-05, "loss": 0.4474, "step": 5689 }, { "epoch": 1.05, "learning_rate": 1.5068459494587492e-05, "loss": 0.4665, "step": 5690 }, { "epoch": 1.05, "learning_rate": 1.5066737516578952e-05, "loss": 0.4409, "step": 5691 }, { "epoch": 1.05, "learning_rate": 1.5065015336416963e-05, "loss": 0.4337, "step": 5692 }, { "epoch": 1.05, "learning_rate": 1.5063292954170242e-05, "loss": 0.4634, "step": 5693 }, { "epoch": 1.05, "learning_rate": 1.5061570369907504e-05, "loss": 0.4308, "step": 5694 }, { "epoch": 1.05, "learning_rate": 1.505984758369748e-05, "loss": 0.4318, "step": 5695 }, { "epoch": 1.05, "learning_rate": 1.505812459560891e-05, "loss": 0.473, "step": 5696 }, { "epoch": 1.05, "learning_rate": 1.5056401405710528e-05, "loss": 0.4344, "step": 5697 }, { "epoch": 1.05, "learning_rate": 1.505467801407109e-05, "loss": 0.4437, "step": 5698 }, { "epoch": 1.05, "learning_rate": 1.5052954420759363e-05, "loss": 0.4297, "step": 5699 }, { "epoch": 1.05, "learning_rate": 1.505123062584411e-05, "loss": 0.4505, "step": 5700 }, { "epoch": 1.05, "learning_rate": 1.5049506629394101e-05, "loss": 0.4329, "step": 5701 }, { "epoch": 1.05, "learning_rate": 1.5047782431478135e-05, "loss": 0.4346, "step": 5702 }, { "epoch": 1.06, "learning_rate": 1.504605803216499e-05, "loss": 0.4292, "step": 5703 }, { "epoch": 1.06, "learning_rate": 1.5044333431523472e-05, "loss": 0.4349, "step": 5704 }, { "epoch": 1.06, "learning_rate": 1.5042608629622391e-05, "loss": 0.4546, "step": 5705 }, { "epoch": 1.06, "learning_rate": 1.504088362653056e-05, "loss": 0.4393, "step": 5706 }, { "epoch": 1.06, "learning_rate": 1.503915842231681e-05, "loss": 0.4417, "step": 5707 }, { "epoch": 1.06, "learning_rate": 1.5037433017049965e-05, "loss": 0.4459, "step": 5708 }, { "epoch": 1.06, "learning_rate": 1.5035707410798868e-05, "loss": 0.4405, "step": 5709 }, { "epoch": 1.06, "learning_rate": 1.5033981603632373e-05, "loss": 0.4386, "step": 5710 }, { "epoch": 1.06, "learning_rate": 1.5032255595619327e-05, "loss": 0.4461, "step": 5711 }, { "epoch": 1.06, "learning_rate": 1.5030529386828602e-05, "loss": 0.4171, "step": 5712 }, { "epoch": 1.06, "learning_rate": 1.502880297732907e-05, "loss": 0.4403, "step": 5713 }, { "epoch": 1.06, "learning_rate": 1.5027076367189607e-05, "loss": 0.4233, "step": 5714 }, { "epoch": 1.06, "learning_rate": 1.5025349556479105e-05, "loss": 0.4482, "step": 5715 }, { "epoch": 1.06, "learning_rate": 1.5023622545266463e-05, "loss": 0.4703, "step": 5716 }, { "epoch": 1.06, "learning_rate": 1.5021895333620578e-05, "loss": 0.4653, "step": 5717 }, { "epoch": 1.06, "learning_rate": 1.5020167921610368e-05, "loss": 0.4407, "step": 5718 }, { "epoch": 1.06, "learning_rate": 1.5018440309304754e-05, "loss": 0.4531, "step": 5719 }, { "epoch": 1.06, "learning_rate": 1.5016712496772661e-05, "loss": 0.4386, "step": 5720 }, { "epoch": 1.06, "learning_rate": 1.5014984484083028e-05, "loss": 0.4456, "step": 5721 }, { "epoch": 1.06, "learning_rate": 1.50132562713048e-05, "loss": 0.4267, "step": 5722 }, { "epoch": 1.06, "learning_rate": 1.5011527858506929e-05, "loss": 0.4356, "step": 5723 }, { "epoch": 1.06, "learning_rate": 1.5009799245758377e-05, "loss": 0.4496, "step": 5724 }, { "epoch": 1.06, "learning_rate": 1.5008070433128108e-05, "loss": 0.4432, "step": 5725 }, { "epoch": 1.06, "learning_rate": 1.50063414206851e-05, "loss": 0.4355, "step": 5726 }, { "epoch": 1.06, "learning_rate": 1.5004612208498339e-05, "loss": 0.4396, "step": 5727 }, { "epoch": 1.06, "learning_rate": 1.5002882796636817e-05, "loss": 0.4334, "step": 5728 }, { "epoch": 1.06, "learning_rate": 1.5001153185169535e-05, "loss": 0.461, "step": 5729 }, { "epoch": 1.06, "learning_rate": 1.49994233741655e-05, "loss": 0.4642, "step": 5730 }, { "epoch": 1.06, "learning_rate": 1.4997693363693728e-05, "loss": 0.4578, "step": 5731 }, { "epoch": 1.06, "learning_rate": 1.4995963153823244e-05, "loss": 0.4488, "step": 5732 }, { "epoch": 1.06, "learning_rate": 1.4994232744623078e-05, "loss": 0.4479, "step": 5733 }, { "epoch": 1.06, "learning_rate": 1.4992502136162274e-05, "loss": 0.4329, "step": 5734 }, { "epoch": 1.06, "learning_rate": 1.4990771328509878e-05, "loss": 0.4386, "step": 5735 }, { "epoch": 1.06, "learning_rate": 1.4989040321734946e-05, "loss": 0.4413, "step": 5736 }, { "epoch": 1.06, "learning_rate": 1.4987309115906543e-05, "loss": 0.4428, "step": 5737 }, { "epoch": 1.06, "learning_rate": 1.4985577711093739e-05, "loss": 0.4363, "step": 5738 }, { "epoch": 1.06, "learning_rate": 1.4983846107365613e-05, "loss": 0.4379, "step": 5739 }, { "epoch": 1.06, "learning_rate": 1.4982114304791257e-05, "loss": 0.4418, "step": 5740 }, { "epoch": 1.06, "learning_rate": 1.4980382303439764e-05, "loss": 0.4342, "step": 5741 }, { "epoch": 1.06, "learning_rate": 1.4978650103380238e-05, "loss": 0.4664, "step": 5742 }, { "epoch": 1.06, "learning_rate": 1.497691770468179e-05, "loss": 0.4629, "step": 5743 }, { "epoch": 1.06, "learning_rate": 1.4975185107413541e-05, "loss": 0.4576, "step": 5744 }, { "epoch": 1.06, "learning_rate": 1.4973452311644616e-05, "loss": 0.4515, "step": 5745 }, { "epoch": 1.06, "learning_rate": 1.4971719317444155e-05, "loss": 0.447, "step": 5746 }, { "epoch": 1.06, "learning_rate": 1.4969986124881297e-05, "loss": 0.4538, "step": 5747 }, { "epoch": 1.06, "learning_rate": 1.4968252734025192e-05, "loss": 0.459, "step": 5748 }, { "epoch": 1.06, "learning_rate": 1.4966519144945005e-05, "loss": 0.4601, "step": 5749 }, { "epoch": 1.06, "learning_rate": 1.4964785357709896e-05, "loss": 0.4653, "step": 5750 }, { "epoch": 1.06, "learning_rate": 1.4963051372389047e-05, "loss": 0.466, "step": 5751 }, { "epoch": 1.06, "learning_rate": 1.4961317189051633e-05, "loss": 0.4334, "step": 5752 }, { "epoch": 1.06, "learning_rate": 1.495958280776685e-05, "loss": 0.4432, "step": 5753 }, { "epoch": 1.06, "learning_rate": 1.4957848228603897e-05, "loss": 0.4455, "step": 5754 }, { "epoch": 1.06, "learning_rate": 1.4956113451631977e-05, "loss": 0.4237, "step": 5755 }, { "epoch": 1.06, "learning_rate": 1.4954378476920309e-05, "loss": 0.4193, "step": 5756 }, { "epoch": 1.07, "learning_rate": 1.495264330453811e-05, "loss": 0.4458, "step": 5757 }, { "epoch": 1.07, "learning_rate": 1.4950907934554612e-05, "loss": 0.4572, "step": 5758 }, { "epoch": 1.07, "learning_rate": 1.4949172367039055e-05, "loss": 0.4361, "step": 5759 }, { "epoch": 1.07, "learning_rate": 1.4947436602060685e-05, "loss": 0.4542, "step": 5760 }, { "epoch": 1.07, "learning_rate": 1.4945700639688753e-05, "loss": 0.47, "step": 5761 }, { "epoch": 1.07, "learning_rate": 1.4943964479992525e-05, "loss": 0.4333, "step": 5762 }, { "epoch": 1.07, "learning_rate": 1.4942228123041265e-05, "loss": 0.4539, "step": 5763 }, { "epoch": 1.07, "learning_rate": 1.4940491568904252e-05, "loss": 0.4445, "step": 5764 }, { "epoch": 1.07, "learning_rate": 1.4938754817650773e-05, "loss": 0.4396, "step": 5765 }, { "epoch": 1.07, "learning_rate": 1.4937017869350123e-05, "loss": 0.447, "step": 5766 }, { "epoch": 1.07, "learning_rate": 1.49352807240716e-05, "loss": 0.4722, "step": 5767 }, { "epoch": 1.07, "learning_rate": 1.4933543381884512e-05, "loss": 0.4416, "step": 5768 }, { "epoch": 1.07, "learning_rate": 1.4931805842858178e-05, "loss": 0.4357, "step": 5769 }, { "epoch": 1.07, "learning_rate": 1.493006810706192e-05, "loss": 0.4416, "step": 5770 }, { "epoch": 1.07, "learning_rate": 1.4928330174565075e-05, "loss": 0.4266, "step": 5771 }, { "epoch": 1.07, "learning_rate": 1.4926592045436979e-05, "loss": 0.4423, "step": 5772 }, { "epoch": 1.07, "learning_rate": 1.4924853719746985e-05, "loss": 0.4459, "step": 5773 }, { "epoch": 1.07, "learning_rate": 1.4923115197564442e-05, "loss": 0.447, "step": 5774 }, { "epoch": 1.07, "learning_rate": 1.4921376478958717e-05, "loss": 0.4479, "step": 5775 }, { "epoch": 1.07, "learning_rate": 1.4919637563999185e-05, "loss": 0.4687, "step": 5776 }, { "epoch": 1.07, "learning_rate": 1.4917898452755222e-05, "loss": 0.4513, "step": 5777 }, { "epoch": 1.07, "learning_rate": 1.4916159145296216e-05, "loss": 0.4399, "step": 5778 }, { "epoch": 1.07, "learning_rate": 1.4914419641691562e-05, "loss": 0.4442, "step": 5779 }, { "epoch": 1.07, "learning_rate": 1.4912679942010663e-05, "loss": 0.4468, "step": 5780 }, { "epoch": 1.07, "learning_rate": 1.491094004632293e-05, "loss": 0.439, "step": 5781 }, { "epoch": 1.07, "learning_rate": 1.4909199954697782e-05, "loss": 0.4193, "step": 5782 }, { "epoch": 1.07, "learning_rate": 1.4907459667204643e-05, "loss": 0.4321, "step": 5783 }, { "epoch": 1.07, "learning_rate": 1.4905719183912953e-05, "loss": 0.4278, "step": 5784 }, { "epoch": 1.07, "learning_rate": 1.4903978504892147e-05, "loss": 0.4357, "step": 5785 }, { "epoch": 1.07, "learning_rate": 1.4902237630211678e-05, "loss": 0.4547, "step": 5786 }, { "epoch": 1.07, "learning_rate": 1.4900496559941004e-05, "loss": 0.4375, "step": 5787 }, { "epoch": 1.07, "learning_rate": 1.4898755294149591e-05, "loss": 0.4385, "step": 5788 }, { "epoch": 1.07, "learning_rate": 1.489701383290691e-05, "loss": 0.4357, "step": 5789 }, { "epoch": 1.07, "learning_rate": 1.4895272176282447e-05, "loss": 0.4373, "step": 5790 }, { "epoch": 1.07, "learning_rate": 1.4893530324345686e-05, "loss": 0.4572, "step": 5791 }, { "epoch": 1.07, "learning_rate": 1.4891788277166125e-05, "loss": 0.4099, "step": 5792 }, { "epoch": 1.07, "learning_rate": 1.4890046034813268e-05, "loss": 0.4387, "step": 5793 }, { "epoch": 1.07, "learning_rate": 1.4888303597356628e-05, "loss": 0.4501, "step": 5794 }, { "epoch": 1.07, "learning_rate": 1.4886560964865725e-05, "loss": 0.4519, "step": 5795 }, { "epoch": 1.07, "learning_rate": 1.4884818137410087e-05, "loss": 0.4514, "step": 5796 }, { "epoch": 1.07, "learning_rate": 1.488307511505925e-05, "loss": 0.4388, "step": 5797 }, { "epoch": 1.07, "learning_rate": 1.4881331897882753e-05, "loss": 0.4438, "step": 5798 }, { "epoch": 1.07, "learning_rate": 1.4879588485950155e-05, "loss": 0.4305, "step": 5799 }, { "epoch": 1.07, "learning_rate": 1.4877844879331009e-05, "loss": 0.4245, "step": 5800 }, { "epoch": 1.07, "learning_rate": 1.4876101078094887e-05, "loss": 0.4364, "step": 5801 }, { "epoch": 1.07, "learning_rate": 1.4874357082311355e-05, "loss": 0.4809, "step": 5802 }, { "epoch": 1.07, "learning_rate": 1.4872612892050002e-05, "loss": 0.4444, "step": 5803 }, { "epoch": 1.07, "learning_rate": 1.4870868507380416e-05, "loss": 0.4408, "step": 5804 }, { "epoch": 1.07, "learning_rate": 1.4869123928372194e-05, "loss": 0.4405, "step": 5805 }, { "epoch": 1.07, "learning_rate": 1.4867379155094943e-05, "loss": 0.4397, "step": 5806 }, { "epoch": 1.07, "learning_rate": 1.4865634187618276e-05, "loss": 0.4488, "step": 5807 }, { "epoch": 1.07, "learning_rate": 1.4863889026011813e-05, "loss": 0.4335, "step": 5808 }, { "epoch": 1.07, "learning_rate": 1.4862143670345182e-05, "loss": 0.4344, "step": 5809 }, { "epoch": 1.07, "learning_rate": 1.486039812068802e-05, "loss": 0.4635, "step": 5810 }, { "epoch": 1.08, "learning_rate": 1.4858652377109974e-05, "loss": 0.4427, "step": 5811 }, { "epoch": 1.08, "learning_rate": 1.4856906439680694e-05, "loss": 0.4436, "step": 5812 }, { "epoch": 1.08, "learning_rate": 1.4855160308469838e-05, "loss": 0.4575, "step": 5813 }, { "epoch": 1.08, "learning_rate": 1.4853413983547075e-05, "loss": 0.4286, "step": 5814 }, { "epoch": 1.08, "learning_rate": 1.4851667464982077e-05, "loss": 0.4384, "step": 5815 }, { "epoch": 1.08, "learning_rate": 1.4849920752844535e-05, "loss": 0.4386, "step": 5816 }, { "epoch": 1.08, "learning_rate": 1.484817384720413e-05, "loss": 0.4443, "step": 5817 }, { "epoch": 1.08, "learning_rate": 1.4846426748130567e-05, "loss": 0.4431, "step": 5818 }, { "epoch": 1.08, "learning_rate": 1.4844679455693549e-05, "loss": 0.4527, "step": 5819 }, { "epoch": 1.08, "learning_rate": 1.4842931969962791e-05, "loss": 0.4361, "step": 5820 }, { "epoch": 1.08, "learning_rate": 1.4841184291008012e-05, "loss": 0.4298, "step": 5821 }, { "epoch": 1.08, "learning_rate": 1.4839436418898945e-05, "loss": 0.448, "step": 5822 }, { "epoch": 1.08, "learning_rate": 1.4837688353705327e-05, "loss": 0.4404, "step": 5823 }, { "epoch": 1.08, "learning_rate": 1.4835940095496897e-05, "loss": 0.4402, "step": 5824 }, { "epoch": 1.08, "learning_rate": 1.4834191644343413e-05, "loss": 0.4603, "step": 5825 }, { "epoch": 1.08, "learning_rate": 1.4832443000314628e-05, "loss": 0.4346, "step": 5826 }, { "epoch": 1.08, "learning_rate": 1.4830694163480319e-05, "loss": 0.4607, "step": 5827 }, { "epoch": 1.08, "learning_rate": 1.4828945133910257e-05, "loss": 0.4565, "step": 5828 }, { "epoch": 1.08, "learning_rate": 1.4827195911674221e-05, "loss": 0.4181, "step": 5829 }, { "epoch": 1.08, "learning_rate": 1.4825446496842008e-05, "loss": 0.4279, "step": 5830 }, { "epoch": 1.08, "learning_rate": 1.4823696889483414e-05, "loss": 0.4371, "step": 5831 }, { "epoch": 1.08, "learning_rate": 1.4821947089668242e-05, "loss": 0.4404, "step": 5832 }, { "epoch": 1.08, "learning_rate": 1.4820197097466312e-05, "loss": 0.4358, "step": 5833 }, { "epoch": 1.08, "learning_rate": 1.4818446912947441e-05, "loss": 0.4367, "step": 5834 }, { "epoch": 1.08, "learning_rate": 1.481669653618146e-05, "loss": 0.4396, "step": 5835 }, { "epoch": 1.08, "learning_rate": 1.4814945967238204e-05, "loss": 0.4379, "step": 5836 }, { "epoch": 1.08, "learning_rate": 1.4813195206187518e-05, "loss": 0.4417, "step": 5837 }, { "epoch": 1.08, "learning_rate": 1.4811444253099256e-05, "loss": 0.4488, "step": 5838 }, { "epoch": 1.08, "learning_rate": 1.4809693108043276e-05, "loss": 0.4338, "step": 5839 }, { "epoch": 1.08, "learning_rate": 1.4807941771089447e-05, "loss": 0.4211, "step": 5840 }, { "epoch": 1.08, "learning_rate": 1.480619024230764e-05, "loss": 0.4376, "step": 5841 }, { "epoch": 1.08, "learning_rate": 1.4804438521767743e-05, "loss": 0.4398, "step": 5842 }, { "epoch": 1.08, "learning_rate": 1.4802686609539645e-05, "loss": 0.4575, "step": 5843 }, { "epoch": 1.08, "learning_rate": 1.4800934505693242e-05, "loss": 0.4598, "step": 5844 }, { "epoch": 1.08, "learning_rate": 1.479918221029844e-05, "loss": 0.4248, "step": 5845 }, { "epoch": 1.08, "learning_rate": 1.4797429723425154e-05, "loss": 0.436, "step": 5846 }, { "epoch": 1.08, "learning_rate": 1.4795677045143304e-05, "loss": 0.4423, "step": 5847 }, { "epoch": 1.08, "learning_rate": 1.4793924175522821e-05, "loss": 0.4597, "step": 5848 }, { "epoch": 1.08, "learning_rate": 1.4792171114633635e-05, "loss": 0.4361, "step": 5849 }, { "epoch": 1.08, "learning_rate": 1.4790417862545698e-05, "loss": 0.4277, "step": 5850 }, { "epoch": 1.08, "learning_rate": 1.4788664419328957e-05, "loss": 0.4295, "step": 5851 }, { "epoch": 1.08, "learning_rate": 1.478691078505337e-05, "loss": 0.4469, "step": 5852 }, { "epoch": 1.08, "learning_rate": 1.4785156959788906e-05, "loss": 0.4431, "step": 5853 }, { "epoch": 1.08, "learning_rate": 1.4783402943605539e-05, "loss": 0.4398, "step": 5854 }, { "epoch": 1.08, "learning_rate": 1.4781648736573248e-05, "loss": 0.4583, "step": 5855 }, { "epoch": 1.08, "learning_rate": 1.477989433876203e-05, "loss": 0.4633, "step": 5856 }, { "epoch": 1.08, "learning_rate": 1.4778139750241876e-05, "loss": 0.4362, "step": 5857 }, { "epoch": 1.08, "learning_rate": 1.4776384971082794e-05, "loss": 0.4261, "step": 5858 }, { "epoch": 1.08, "learning_rate": 1.477463000135479e-05, "loss": 0.4568, "step": 5859 }, { "epoch": 1.08, "learning_rate": 1.4772874841127894e-05, "loss": 0.435, "step": 5860 }, { "epoch": 1.08, "learning_rate": 1.4771119490472128e-05, "loss": 0.4438, "step": 5861 }, { "epoch": 1.08, "learning_rate": 1.4769363949457525e-05, "loss": 0.4495, "step": 5862 }, { "epoch": 1.08, "learning_rate": 1.4767608218154133e-05, "loss": 0.4283, "step": 5863 }, { "epoch": 1.08, "learning_rate": 1.4765852296631998e-05, "loss": 0.4407, "step": 5864 }, { "epoch": 1.09, "learning_rate": 1.4764096184961181e-05, "loss": 0.4168, "step": 5865 }, { "epoch": 1.09, "learning_rate": 1.4762339883211745e-05, "loss": 0.4574, "step": 5866 }, { "epoch": 1.09, "learning_rate": 1.4760583391453767e-05, "loss": 0.446, "step": 5867 }, { "epoch": 1.09, "learning_rate": 1.4758826709757326e-05, "loss": 0.4526, "step": 5868 }, { "epoch": 1.09, "learning_rate": 1.4757069838192508e-05, "loss": 0.4446, "step": 5869 }, { "epoch": 1.09, "learning_rate": 1.4755312776829414e-05, "loss": 0.4501, "step": 5870 }, { "epoch": 1.09, "learning_rate": 1.4753555525738142e-05, "loss": 0.4393, "step": 5871 }, { "epoch": 1.09, "learning_rate": 1.4751798084988807e-05, "loss": 0.4547, "step": 5872 }, { "epoch": 1.09, "learning_rate": 1.4750040454651525e-05, "loss": 0.4383, "step": 5873 }, { "epoch": 1.09, "learning_rate": 1.4748282634796423e-05, "loss": 0.4473, "step": 5874 }, { "epoch": 1.09, "learning_rate": 1.4746524625493637e-05, "loss": 0.4635, "step": 5875 }, { "epoch": 1.09, "learning_rate": 1.4744766426813304e-05, "loss": 0.4403, "step": 5876 }, { "epoch": 1.09, "learning_rate": 1.4743008038825577e-05, "loss": 0.4563, "step": 5877 }, { "epoch": 1.09, "learning_rate": 1.4741249461600611e-05, "loss": 0.4575, "step": 5878 }, { "epoch": 1.09, "learning_rate": 1.4739490695208569e-05, "loss": 0.4392, "step": 5879 }, { "epoch": 1.09, "learning_rate": 1.4737731739719624e-05, "loss": 0.4374, "step": 5880 }, { "epoch": 1.09, "learning_rate": 1.4735972595203951e-05, "loss": 0.455, "step": 5881 }, { "epoch": 1.09, "learning_rate": 1.4734213261731742e-05, "loss": 0.4473, "step": 5882 }, { "epoch": 1.09, "learning_rate": 1.473245373937319e-05, "loss": 0.4238, "step": 5883 }, { "epoch": 1.09, "learning_rate": 1.4730694028198496e-05, "loss": 0.4177, "step": 5884 }, { "epoch": 1.09, "learning_rate": 1.4728934128277868e-05, "loss": 0.4544, "step": 5885 }, { "epoch": 1.09, "learning_rate": 1.4727174039681522e-05, "loss": 0.4552, "step": 5886 }, { "epoch": 1.09, "learning_rate": 1.4725413762479686e-05, "loss": 0.4418, "step": 5887 }, { "epoch": 1.09, "learning_rate": 1.472365329674259e-05, "loss": 0.4295, "step": 5888 }, { "epoch": 1.09, "learning_rate": 1.4721892642540475e-05, "loss": 0.4668, "step": 5889 }, { "epoch": 1.09, "learning_rate": 1.4720131799943582e-05, "loss": 0.4492, "step": 5890 }, { "epoch": 1.09, "learning_rate": 1.471837076902217e-05, "loss": 0.4246, "step": 5891 }, { "epoch": 1.09, "learning_rate": 1.4716609549846498e-05, "loss": 0.4372, "step": 5892 }, { "epoch": 1.09, "learning_rate": 1.4714848142486842e-05, "loss": 0.4277, "step": 5893 }, { "epoch": 1.09, "learning_rate": 1.471308654701347e-05, "loss": 0.4515, "step": 5894 }, { "epoch": 1.09, "learning_rate": 1.4711324763496674e-05, "loss": 0.4562, "step": 5895 }, { "epoch": 1.09, "learning_rate": 1.4709562792006744e-05, "loss": 0.4268, "step": 5896 }, { "epoch": 1.09, "learning_rate": 1.4707800632613975e-05, "loss": 0.4526, "step": 5897 }, { "epoch": 1.09, "learning_rate": 1.4706038285388678e-05, "loss": 0.4495, "step": 5898 }, { "epoch": 1.09, "learning_rate": 1.470427575040117e-05, "loss": 0.4452, "step": 5899 }, { "epoch": 1.09, "learning_rate": 1.4702513027721763e-05, "loss": 0.4461, "step": 5900 }, { "epoch": 1.09, "learning_rate": 1.4700750117420796e-05, "loss": 0.4446, "step": 5901 }, { "epoch": 1.09, "learning_rate": 1.4698987019568603e-05, "loss": 0.4568, "step": 5902 }, { "epoch": 1.09, "learning_rate": 1.4697223734235526e-05, "loss": 0.4304, "step": 5903 }, { "epoch": 1.09, "learning_rate": 1.4695460261491918e-05, "loss": 0.4413, "step": 5904 }, { "epoch": 1.09, "learning_rate": 1.4693696601408143e-05, "loss": 0.4334, "step": 5905 }, { "epoch": 1.09, "learning_rate": 1.469193275405456e-05, "loss": 0.4354, "step": 5906 }, { "epoch": 1.09, "learning_rate": 1.469016871950155e-05, "loss": 0.4619, "step": 5907 }, { "epoch": 1.09, "learning_rate": 1.4688404497819489e-05, "loss": 0.4682, "step": 5908 }, { "epoch": 1.09, "learning_rate": 1.468664008907877e-05, "loss": 0.4302, "step": 5909 }, { "epoch": 1.09, "learning_rate": 1.468487549334979e-05, "loss": 0.4334, "step": 5910 }, { "epoch": 1.09, "learning_rate": 1.468311071070295e-05, "loss": 0.4295, "step": 5911 }, { "epoch": 1.09, "learning_rate": 1.4681345741208663e-05, "loss": 0.4577, "step": 5912 }, { "epoch": 1.09, "learning_rate": 1.4679580584937348e-05, "loss": 0.4453, "step": 5913 }, { "epoch": 1.09, "learning_rate": 1.4677815241959432e-05, "loss": 0.4314, "step": 5914 }, { "epoch": 1.09, "learning_rate": 1.4676049712345348e-05, "loss": 0.4392, "step": 5915 }, { "epoch": 1.09, "learning_rate": 1.4674283996165542e-05, "loss": 0.4543, "step": 5916 }, { "epoch": 1.09, "learning_rate": 1.4672518093490455e-05, "loss": 0.4236, "step": 5917 }, { "epoch": 1.09, "learning_rate": 1.4670752004390547e-05, "loss": 0.4473, "step": 5918 }, { "epoch": 1.1, "learning_rate": 1.4668985728936282e-05, "loss": 0.422, "step": 5919 }, { "epoch": 1.1, "learning_rate": 1.4667219267198132e-05, "loss": 0.4388, "step": 5920 }, { "epoch": 1.1, "learning_rate": 1.4665452619246571e-05, "loss": 0.4706, "step": 5921 }, { "epoch": 1.1, "learning_rate": 1.466368578515209e-05, "loss": 0.453, "step": 5922 }, { "epoch": 1.1, "learning_rate": 1.4661918764985184e-05, "loss": 0.4441, "step": 5923 }, { "epoch": 1.1, "learning_rate": 1.4660151558816346e-05, "loss": 0.4446, "step": 5924 }, { "epoch": 1.1, "learning_rate": 1.465838416671609e-05, "loss": 0.4485, "step": 5925 }, { "epoch": 1.1, "learning_rate": 1.4656616588754933e-05, "loss": 0.4366, "step": 5926 }, { "epoch": 1.1, "learning_rate": 1.4654848825003396e-05, "loss": 0.4476, "step": 5927 }, { "epoch": 1.1, "learning_rate": 1.4653080875532007e-05, "loss": 0.4376, "step": 5928 }, { "epoch": 1.1, "learning_rate": 1.4651312740411306e-05, "loss": 0.438, "step": 5929 }, { "epoch": 1.1, "learning_rate": 1.4649544419711838e-05, "loss": 0.4519, "step": 5930 }, { "epoch": 1.1, "learning_rate": 1.4647775913504156e-05, "loss": 0.4402, "step": 5931 }, { "epoch": 1.1, "learning_rate": 1.4646007221858823e-05, "loss": 0.4592, "step": 5932 }, { "epoch": 1.1, "learning_rate": 1.46442383448464e-05, "loss": 0.4283, "step": 5933 }, { "epoch": 1.1, "learning_rate": 1.4642469282537466e-05, "loss": 0.4561, "step": 5934 }, { "epoch": 1.1, "learning_rate": 1.4640700035002607e-05, "loss": 0.4525, "step": 5935 }, { "epoch": 1.1, "learning_rate": 1.4638930602312403e-05, "loss": 0.446, "step": 5936 }, { "epoch": 1.1, "learning_rate": 1.463716098453746e-05, "loss": 0.4432, "step": 5937 }, { "epoch": 1.1, "learning_rate": 1.4635391181748379e-05, "loss": 0.4534, "step": 5938 }, { "epoch": 1.1, "learning_rate": 1.4633621194015772e-05, "loss": 0.4497, "step": 5939 }, { "epoch": 1.1, "learning_rate": 1.4631851021410258e-05, "loss": 0.4371, "step": 5940 }, { "epoch": 1.1, "learning_rate": 1.4630080664002462e-05, "loss": 0.4352, "step": 5941 }, { "epoch": 1.1, "learning_rate": 1.4628310121863022e-05, "loss": 0.4493, "step": 5942 }, { "epoch": 1.1, "learning_rate": 1.4626539395062578e-05, "loss": 0.4414, "step": 5943 }, { "epoch": 1.1, "learning_rate": 1.4624768483671776e-05, "loss": 0.4496, "step": 5944 }, { "epoch": 1.1, "learning_rate": 1.4622997387761274e-05, "loss": 0.4159, "step": 5945 }, { "epoch": 1.1, "learning_rate": 1.4621226107401736e-05, "loss": 0.4406, "step": 5946 }, { "epoch": 1.1, "learning_rate": 1.4619454642663833e-05, "loss": 0.4359, "step": 5947 }, { "epoch": 1.1, "learning_rate": 1.4617682993618241e-05, "loss": 0.4457, "step": 5948 }, { "epoch": 1.1, "learning_rate": 1.461591116033565e-05, "loss": 0.4382, "step": 5949 }, { "epoch": 1.1, "learning_rate": 1.4614139142886748e-05, "loss": 0.4435, "step": 5950 }, { "epoch": 1.1, "learning_rate": 1.4612366941342236e-05, "loss": 0.4346, "step": 5951 }, { "epoch": 1.1, "learning_rate": 1.4610594555772824e-05, "loss": 0.4512, "step": 5952 }, { "epoch": 1.1, "learning_rate": 1.4608821986249225e-05, "loss": 0.4479, "step": 5953 }, { "epoch": 1.1, "learning_rate": 1.4607049232842162e-05, "loss": 0.4406, "step": 5954 }, { "epoch": 1.1, "learning_rate": 1.4605276295622366e-05, "loss": 0.4536, "step": 5955 }, { "epoch": 1.1, "learning_rate": 1.4603503174660569e-05, "loss": 0.4692, "step": 5956 }, { "epoch": 1.1, "learning_rate": 1.4601729870027519e-05, "loss": 0.4431, "step": 5957 }, { "epoch": 1.1, "learning_rate": 1.4599956381793967e-05, "loss": 0.4548, "step": 5958 }, { "epoch": 1.1, "learning_rate": 1.4598182710030673e-05, "loss": 0.4374, "step": 5959 }, { "epoch": 1.1, "learning_rate": 1.4596408854808403e-05, "loss": 0.45, "step": 5960 }, { "epoch": 1.1, "learning_rate": 1.459463481619793e-05, "loss": 0.4479, "step": 5961 }, { "epoch": 1.1, "learning_rate": 1.4592860594270033e-05, "loss": 0.4407, "step": 5962 }, { "epoch": 1.1, "learning_rate": 1.4591086189095503e-05, "loss": 0.4593, "step": 5963 }, { "epoch": 1.1, "learning_rate": 1.458931160074513e-05, "loss": 0.425, "step": 5964 }, { "epoch": 1.1, "learning_rate": 1.4587536829289729e-05, "loss": 0.4316, "step": 5965 }, { "epoch": 1.1, "learning_rate": 1.4585761874800097e-05, "loss": 0.4534, "step": 5966 }, { "epoch": 1.1, "learning_rate": 1.4583986737347056e-05, "loss": 0.4447, "step": 5967 }, { "epoch": 1.1, "learning_rate": 1.4582211417001432e-05, "loss": 0.4392, "step": 5968 }, { "epoch": 1.1, "learning_rate": 1.4580435913834054e-05, "loss": 0.464, "step": 5969 }, { "epoch": 1.1, "learning_rate": 1.4578660227915769e-05, "loss": 0.4311, "step": 5970 }, { "epoch": 1.1, "learning_rate": 1.4576884359317411e-05, "loss": 0.4415, "step": 5971 }, { "epoch": 1.1, "learning_rate": 1.4575108308109846e-05, "loss": 0.4196, "step": 5972 }, { "epoch": 1.11, "learning_rate": 1.4573332074363929e-05, "loss": 0.4595, "step": 5973 }, { "epoch": 1.11, "learning_rate": 1.4571555658150529e-05, "loss": 0.4209, "step": 5974 }, { "epoch": 1.11, "learning_rate": 1.4569779059540522e-05, "loss": 0.4372, "step": 5975 }, { "epoch": 1.11, "learning_rate": 1.4568002278604793e-05, "loss": 0.4394, "step": 5976 }, { "epoch": 1.11, "learning_rate": 1.456622531541423e-05, "loss": 0.4622, "step": 5977 }, { "epoch": 1.11, "learning_rate": 1.4564448170039732e-05, "loss": 0.4428, "step": 5978 }, { "epoch": 1.11, "learning_rate": 1.45626708425522e-05, "loss": 0.4531, "step": 5979 }, { "epoch": 1.11, "learning_rate": 1.456089333302255e-05, "loss": 0.4355, "step": 5980 }, { "epoch": 1.11, "learning_rate": 1.4559115641521699e-05, "loss": 0.4419, "step": 5981 }, { "epoch": 1.11, "learning_rate": 1.4557337768120578e-05, "loss": 0.4573, "step": 5982 }, { "epoch": 1.11, "learning_rate": 1.4555559712890118e-05, "loss": 0.4426, "step": 5983 }, { "epoch": 1.11, "learning_rate": 1.4553781475901256e-05, "loss": 0.4426, "step": 5984 }, { "epoch": 1.11, "learning_rate": 1.4552003057224948e-05, "loss": 0.4436, "step": 5985 }, { "epoch": 1.11, "learning_rate": 1.4550224456932143e-05, "loss": 0.4519, "step": 5986 }, { "epoch": 1.11, "learning_rate": 1.454844567509381e-05, "loss": 0.4578, "step": 5987 }, { "epoch": 1.11, "learning_rate": 1.4546666711780914e-05, "loss": 0.4393, "step": 5988 }, { "epoch": 1.11, "learning_rate": 1.4544887567064434e-05, "loss": 0.4324, "step": 5989 }, { "epoch": 1.11, "learning_rate": 1.4543108241015353e-05, "loss": 0.4454, "step": 5990 }, { "epoch": 1.11, "learning_rate": 1.4541328733704664e-05, "loss": 0.4425, "step": 5991 }, { "epoch": 1.11, "learning_rate": 1.453954904520337e-05, "loss": 0.4621, "step": 5992 }, { "epoch": 1.11, "learning_rate": 1.4537769175582473e-05, "loss": 0.4498, "step": 5993 }, { "epoch": 1.11, "learning_rate": 1.4535989124912987e-05, "loss": 0.4558, "step": 5994 }, { "epoch": 1.11, "learning_rate": 1.453420889326593e-05, "loss": 0.4439, "step": 5995 }, { "epoch": 1.11, "learning_rate": 1.4532428480712338e-05, "loss": 0.4595, "step": 5996 }, { "epoch": 1.11, "learning_rate": 1.4530647887323236e-05, "loss": 0.4447, "step": 5997 }, { "epoch": 1.11, "learning_rate": 1.4528867113169677e-05, "loss": 0.4589, "step": 5998 }, { "epoch": 1.11, "learning_rate": 1.4527086158322703e-05, "loss": 0.4559, "step": 5999 }, { "epoch": 1.11, "learning_rate": 1.4525305022853372e-05, "loss": 0.4524, "step": 6000 }, { "epoch": 1.11, "learning_rate": 1.4523523706832749e-05, "loss": 0.4645, "step": 6001 }, { "epoch": 1.11, "learning_rate": 1.4521742210331906e-05, "loss": 0.4192, "step": 6002 }, { "epoch": 1.11, "learning_rate": 1.451996053342192e-05, "loss": 0.4524, "step": 6003 }, { "epoch": 1.11, "learning_rate": 1.451817867617388e-05, "loss": 0.4399, "step": 6004 }, { "epoch": 1.11, "learning_rate": 1.4516396638658874e-05, "loss": 0.4332, "step": 6005 }, { "epoch": 1.11, "learning_rate": 1.4514614420948004e-05, "loss": 0.442, "step": 6006 }, { "epoch": 1.11, "learning_rate": 1.4512832023112375e-05, "loss": 0.4484, "step": 6007 }, { "epoch": 1.11, "learning_rate": 1.4511049445223107e-05, "loss": 0.4356, "step": 6008 }, { "epoch": 1.11, "learning_rate": 1.4509266687351318e-05, "loss": 0.4404, "step": 6009 }, { "epoch": 1.11, "learning_rate": 1.4507483749568134e-05, "loss": 0.4501, "step": 6010 }, { "epoch": 1.11, "learning_rate": 1.4505700631944694e-05, "loss": 0.4543, "step": 6011 }, { "epoch": 1.11, "learning_rate": 1.4503917334552142e-05, "loss": 0.4553, "step": 6012 }, { "epoch": 1.11, "learning_rate": 1.4502133857461629e-05, "loss": 0.4472, "step": 6013 }, { "epoch": 1.11, "learning_rate": 1.4500350200744307e-05, "loss": 0.4648, "step": 6014 }, { "epoch": 1.11, "learning_rate": 1.4498566364471348e-05, "loss": 0.4367, "step": 6015 }, { "epoch": 1.11, "learning_rate": 1.4496782348713919e-05, "loss": 0.433, "step": 6016 }, { "epoch": 1.11, "learning_rate": 1.4494998153543196e-05, "loss": 0.4473, "step": 6017 }, { "epoch": 1.11, "learning_rate": 1.4493213779030373e-05, "loss": 0.4472, "step": 6018 }, { "epoch": 1.11, "learning_rate": 1.4491429225246636e-05, "loss": 0.4402, "step": 6019 }, { "epoch": 1.11, "learning_rate": 1.448964449226319e-05, "loss": 0.4554, "step": 6020 }, { "epoch": 1.11, "learning_rate": 1.4487859580151243e-05, "loss": 0.425, "step": 6021 }, { "epoch": 1.11, "learning_rate": 1.4486074488982004e-05, "loss": 0.4172, "step": 6022 }, { "epoch": 1.11, "learning_rate": 1.44842892188267e-05, "loss": 0.4605, "step": 6023 }, { "epoch": 1.11, "learning_rate": 1.448250376975656e-05, "loss": 0.4289, "step": 6024 }, { "epoch": 1.11, "learning_rate": 1.448071814184282e-05, "loss": 0.4475, "step": 6025 }, { "epoch": 1.11, "learning_rate": 1.4478932335156721e-05, "loss": 0.4434, "step": 6026 }, { "epoch": 1.12, "learning_rate": 1.4477146349769513e-05, "loss": 0.4553, "step": 6027 }, { "epoch": 1.12, "learning_rate": 1.4475360185752454e-05, "loss": 0.4498, "step": 6028 }, { "epoch": 1.12, "learning_rate": 1.4473573843176812e-05, "loss": 0.448, "step": 6029 }, { "epoch": 1.12, "learning_rate": 1.4471787322113855e-05, "loss": 0.4584, "step": 6030 }, { "epoch": 1.12, "learning_rate": 1.4470000622634865e-05, "loss": 0.4546, "step": 6031 }, { "epoch": 1.12, "learning_rate": 1.4468213744811124e-05, "loss": 0.451, "step": 6032 }, { "epoch": 1.12, "learning_rate": 1.4466426688713928e-05, "loss": 0.4361, "step": 6033 }, { "epoch": 1.12, "learning_rate": 1.4464639454414576e-05, "loss": 0.4409, "step": 6034 }, { "epoch": 1.12, "learning_rate": 1.4462852041984374e-05, "loss": 0.419, "step": 6035 }, { "epoch": 1.12, "learning_rate": 1.4461064451494642e-05, "loss": 0.4386, "step": 6036 }, { "epoch": 1.12, "learning_rate": 1.44592766830167e-05, "loss": 0.4566, "step": 6037 }, { "epoch": 1.12, "learning_rate": 1.4457488736621868e-05, "loss": 0.4488, "step": 6038 }, { "epoch": 1.12, "learning_rate": 1.445570061238149e-05, "loss": 0.4398, "step": 6039 }, { "epoch": 1.12, "learning_rate": 1.4453912310366907e-05, "loss": 0.459, "step": 6040 }, { "epoch": 1.12, "learning_rate": 1.4452123830649471e-05, "loss": 0.447, "step": 6041 }, { "epoch": 1.12, "learning_rate": 1.4450335173300537e-05, "loss": 0.465, "step": 6042 }, { "epoch": 1.12, "learning_rate": 1.444854633839147e-05, "loss": 0.4568, "step": 6043 }, { "epoch": 1.12, "learning_rate": 1.4446757325993636e-05, "loss": 0.4439, "step": 6044 }, { "epoch": 1.12, "learning_rate": 1.4444968136178421e-05, "loss": 0.443, "step": 6045 }, { "epoch": 1.12, "learning_rate": 1.4443178769017205e-05, "loss": 0.4423, "step": 6046 }, { "epoch": 1.12, "learning_rate": 1.4441389224581384e-05, "loss": 0.4642, "step": 6047 }, { "epoch": 1.12, "learning_rate": 1.4439599502942354e-05, "loss": 0.4156, "step": 6048 }, { "epoch": 1.12, "learning_rate": 1.4437809604171527e-05, "loss": 0.4454, "step": 6049 }, { "epoch": 1.12, "learning_rate": 1.443601952834031e-05, "loss": 0.4456, "step": 6050 }, { "epoch": 1.12, "learning_rate": 1.4434229275520128e-05, "loss": 0.4648, "step": 6051 }, { "epoch": 1.12, "learning_rate": 1.4432438845782408e-05, "loss": 0.4512, "step": 6052 }, { "epoch": 1.12, "learning_rate": 1.4430648239198586e-05, "loss": 0.4299, "step": 6053 }, { "epoch": 1.12, "learning_rate": 1.44288574558401e-05, "loss": 0.4502, "step": 6054 }, { "epoch": 1.12, "learning_rate": 1.4427066495778401e-05, "loss": 0.4454, "step": 6055 }, { "epoch": 1.12, "learning_rate": 1.4425275359084946e-05, "loss": 0.4341, "step": 6056 }, { "epoch": 1.12, "learning_rate": 1.4423484045831197e-05, "loss": 0.4528, "step": 6057 }, { "epoch": 1.12, "learning_rate": 1.4421692556088627e-05, "loss": 0.4521, "step": 6058 }, { "epoch": 1.12, "learning_rate": 1.441990088992871e-05, "loss": 0.4458, "step": 6059 }, { "epoch": 1.12, "learning_rate": 1.4418109047422928e-05, "loss": 0.4607, "step": 6060 }, { "epoch": 1.12, "learning_rate": 1.4416317028642776e-05, "loss": 0.4421, "step": 6061 }, { "epoch": 1.12, "learning_rate": 1.441452483365975e-05, "loss": 0.4396, "step": 6062 }, { "epoch": 1.12, "learning_rate": 1.441273246254536e-05, "loss": 0.4502, "step": 6063 }, { "epoch": 1.12, "learning_rate": 1.4410939915371114e-05, "loss": 0.4279, "step": 6064 }, { "epoch": 1.12, "learning_rate": 1.4409147192208531e-05, "loss": 0.437, "step": 6065 }, { "epoch": 1.12, "learning_rate": 1.4407354293129137e-05, "loss": 0.4395, "step": 6066 }, { "epoch": 1.12, "learning_rate": 1.4405561218204467e-05, "loss": 0.446, "step": 6067 }, { "epoch": 1.12, "learning_rate": 1.4403767967506061e-05, "loss": 0.4608, "step": 6068 }, { "epoch": 1.12, "learning_rate": 1.4401974541105468e-05, "loss": 0.4437, "step": 6069 }, { "epoch": 1.12, "learning_rate": 1.440018093907424e-05, "loss": 0.4459, "step": 6070 }, { "epoch": 1.12, "learning_rate": 1.4398387161483938e-05, "loss": 0.4483, "step": 6071 }, { "epoch": 1.12, "learning_rate": 1.4396593208406134e-05, "loss": 0.447, "step": 6072 }, { "epoch": 1.12, "learning_rate": 1.4394799079912399e-05, "loss": 0.4205, "step": 6073 }, { "epoch": 1.12, "learning_rate": 1.4393004776074317e-05, "loss": 0.4415, "step": 6074 }, { "epoch": 1.12, "learning_rate": 1.4391210296963483e-05, "loss": 0.4273, "step": 6075 }, { "epoch": 1.12, "learning_rate": 1.4389415642651482e-05, "loss": 0.4354, "step": 6076 }, { "epoch": 1.12, "learning_rate": 1.4387620813209928e-05, "loss": 0.44, "step": 6077 }, { "epoch": 1.12, "learning_rate": 1.4385825808710423e-05, "loss": 0.443, "step": 6078 }, { "epoch": 1.12, "learning_rate": 1.4384030629224593e-05, "loss": 0.4426, "step": 6079 }, { "epoch": 1.12, "learning_rate": 1.4382235274824055e-05, "loss": 0.45, "step": 6080 }, { "epoch": 1.13, "learning_rate": 1.4380439745580444e-05, "loss": 0.4603, "step": 6081 }, { "epoch": 1.13, "learning_rate": 1.4378644041565398e-05, "loss": 0.4541, "step": 6082 }, { "epoch": 1.13, "learning_rate": 1.4376848162850558e-05, "loss": 0.4393, "step": 6083 }, { "epoch": 1.13, "learning_rate": 1.4375052109507582e-05, "loss": 0.4304, "step": 6084 }, { "epoch": 1.13, "learning_rate": 1.4373255881608126e-05, "loss": 0.4649, "step": 6085 }, { "epoch": 1.13, "learning_rate": 1.4371459479223861e-05, "loss": 0.4407, "step": 6086 }, { "epoch": 1.13, "learning_rate": 1.4369662902426454e-05, "loss": 0.436, "step": 6087 }, { "epoch": 1.13, "learning_rate": 1.4367866151287586e-05, "loss": 0.4455, "step": 6088 }, { "epoch": 1.13, "learning_rate": 1.4366069225878947e-05, "loss": 0.4247, "step": 6089 }, { "epoch": 1.13, "learning_rate": 1.4364272126272227e-05, "loss": 0.4622, "step": 6090 }, { "epoch": 1.13, "learning_rate": 1.4362474852539133e-05, "loss": 0.4442, "step": 6091 }, { "epoch": 1.13, "learning_rate": 1.4360677404751368e-05, "loss": 0.4544, "step": 6092 }, { "epoch": 1.13, "learning_rate": 1.4358879782980648e-05, "loss": 0.4534, "step": 6093 }, { "epoch": 1.13, "learning_rate": 1.4357081987298696e-05, "loss": 0.4399, "step": 6094 }, { "epoch": 1.13, "learning_rate": 1.4355284017777235e-05, "loss": 0.4427, "step": 6095 }, { "epoch": 1.13, "learning_rate": 1.4353485874488009e-05, "loss": 0.4528, "step": 6096 }, { "epoch": 1.13, "learning_rate": 1.4351687557502759e-05, "loss": 0.441, "step": 6097 }, { "epoch": 1.13, "learning_rate": 1.4349889066893227e-05, "loss": 0.4238, "step": 6098 }, { "epoch": 1.13, "learning_rate": 1.4348090402731178e-05, "loss": 0.4592, "step": 6099 }, { "epoch": 1.13, "learning_rate": 1.4346291565088373e-05, "loss": 0.4439, "step": 6100 }, { "epoch": 1.13, "learning_rate": 1.4344492554036578e-05, "loss": 0.4419, "step": 6101 }, { "epoch": 1.13, "learning_rate": 1.4342693369647575e-05, "loss": 0.4654, "step": 6102 }, { "epoch": 1.13, "learning_rate": 1.4340894011993152e-05, "loss": 0.4482, "step": 6103 }, { "epoch": 1.13, "learning_rate": 1.433909448114509e-05, "loss": 0.4365, "step": 6104 }, { "epoch": 1.13, "learning_rate": 1.4337294777175192e-05, "loss": 0.4396, "step": 6105 }, { "epoch": 1.13, "learning_rate": 1.4335494900155263e-05, "loss": 0.4399, "step": 6106 }, { "epoch": 1.13, "learning_rate": 1.4333694850157113e-05, "loss": 0.4497, "step": 6107 }, { "epoch": 1.13, "learning_rate": 1.4331894627252567e-05, "loss": 0.4511, "step": 6108 }, { "epoch": 1.13, "learning_rate": 1.4330094231513443e-05, "loss": 0.4533, "step": 6109 }, { "epoch": 1.13, "learning_rate": 1.4328293663011574e-05, "loss": 0.4461, "step": 6110 }, { "epoch": 1.13, "learning_rate": 1.4326492921818801e-05, "loss": 0.4467, "step": 6111 }, { "epoch": 1.13, "learning_rate": 1.4324692008006975e-05, "loss": 0.4667, "step": 6112 }, { "epoch": 1.13, "learning_rate": 1.4322890921647943e-05, "loss": 0.4419, "step": 6113 }, { "epoch": 1.13, "learning_rate": 1.4321089662813568e-05, "loss": 0.4433, "step": 6114 }, { "epoch": 1.13, "learning_rate": 1.4319288231575714e-05, "loss": 0.4123, "step": 6115 }, { "epoch": 1.13, "learning_rate": 1.4317486628006256e-05, "loss": 0.4351, "step": 6116 }, { "epoch": 1.13, "learning_rate": 1.4315684852177074e-05, "loss": 0.4401, "step": 6117 }, { "epoch": 1.13, "learning_rate": 1.4313882904160059e-05, "loss": 0.4375, "step": 6118 }, { "epoch": 1.13, "learning_rate": 1.4312080784027103e-05, "loss": 0.4292, "step": 6119 }, { "epoch": 1.13, "learning_rate": 1.4310278491850107e-05, "loss": 0.4331, "step": 6120 }, { "epoch": 1.13, "learning_rate": 1.4308476027700979e-05, "loss": 0.4351, "step": 6121 }, { "epoch": 1.13, "learning_rate": 1.4306673391651634e-05, "loss": 0.4317, "step": 6122 }, { "epoch": 1.13, "learning_rate": 1.4304870583773995e-05, "loss": 0.4658, "step": 6123 }, { "epoch": 1.13, "learning_rate": 1.430306760413999e-05, "loss": 0.4504, "step": 6124 }, { "epoch": 1.13, "learning_rate": 1.4301264452821557e-05, "loss": 0.4462, "step": 6125 }, { "epoch": 1.13, "learning_rate": 1.4299461129890633e-05, "loss": 0.4276, "step": 6126 }, { "epoch": 1.13, "learning_rate": 1.4297657635419171e-05, "loss": 0.4421, "step": 6127 }, { "epoch": 1.13, "learning_rate": 1.4295853969479123e-05, "loss": 0.4431, "step": 6128 }, { "epoch": 1.13, "learning_rate": 1.4294050132142458e-05, "loss": 0.4453, "step": 6129 }, { "epoch": 1.13, "learning_rate": 1.4292246123481147e-05, "loss": 0.4242, "step": 6130 }, { "epoch": 1.13, "learning_rate": 1.4290441943567158e-05, "loss": 0.4322, "step": 6131 }, { "epoch": 1.13, "learning_rate": 1.4288637592472479e-05, "loss": 0.434, "step": 6132 }, { "epoch": 1.13, "learning_rate": 1.42868330702691e-05, "loss": 0.4311, "step": 6133 }, { "epoch": 1.13, "learning_rate": 1.4285028377029018e-05, "loss": 0.4565, "step": 6134 }, { "epoch": 1.14, "learning_rate": 1.4283223512824238e-05, "loss": 0.4298, "step": 6135 }, { "epoch": 1.14, "learning_rate": 1.4281418477726773e-05, "loss": 0.4354, "step": 6136 }, { "epoch": 1.14, "learning_rate": 1.4279613271808634e-05, "loss": 0.4285, "step": 6137 }, { "epoch": 1.14, "learning_rate": 1.427780789514185e-05, "loss": 0.4235, "step": 6138 }, { "epoch": 1.14, "learning_rate": 1.4276002347798453e-05, "loss": 0.4549, "step": 6139 }, { "epoch": 1.14, "learning_rate": 1.4274196629850474e-05, "loss": 0.4297, "step": 6140 }, { "epoch": 1.14, "learning_rate": 1.427239074136997e-05, "loss": 0.4677, "step": 6141 }, { "epoch": 1.14, "learning_rate": 1.427058468242898e-05, "loss": 0.4175, "step": 6142 }, { "epoch": 1.14, "learning_rate": 1.426877845309957e-05, "loss": 0.4524, "step": 6143 }, { "epoch": 1.14, "learning_rate": 1.4266972053453802e-05, "loss": 0.4363, "step": 6144 }, { "epoch": 1.14, "learning_rate": 1.426516548356375e-05, "loss": 0.457, "step": 6145 }, { "epoch": 1.14, "learning_rate": 1.4263358743501492e-05, "loss": 0.4674, "step": 6146 }, { "epoch": 1.14, "learning_rate": 1.4261551833339113e-05, "loss": 0.4761, "step": 6147 }, { "epoch": 1.14, "learning_rate": 1.4259744753148707e-05, "loss": 0.4483, "step": 6148 }, { "epoch": 1.14, "learning_rate": 1.425793750300237e-05, "loss": 0.4397, "step": 6149 }, { "epoch": 1.14, "learning_rate": 1.4256130082972211e-05, "loss": 0.4327, "step": 6150 }, { "epoch": 1.14, "learning_rate": 1.425432249313034e-05, "loss": 0.4381, "step": 6151 }, { "epoch": 1.14, "learning_rate": 1.4252514733548885e-05, "loss": 0.4753, "step": 6152 }, { "epoch": 1.14, "learning_rate": 1.4250706804299961e-05, "loss": 0.4349, "step": 6153 }, { "epoch": 1.14, "learning_rate": 1.4248898705455704e-05, "loss": 0.4544, "step": 6154 }, { "epoch": 1.14, "learning_rate": 1.4247090437088256e-05, "loss": 0.4413, "step": 6155 }, { "epoch": 1.14, "learning_rate": 1.4245281999269764e-05, "loss": 0.4391, "step": 6156 }, { "epoch": 1.14, "learning_rate": 1.4243473392072377e-05, "loss": 0.4557, "step": 6157 }, { "epoch": 1.14, "learning_rate": 1.4241664615568265e-05, "loss": 0.4263, "step": 6158 }, { "epoch": 1.14, "learning_rate": 1.4239855669829583e-05, "loss": 0.4347, "step": 6159 }, { "epoch": 1.14, "learning_rate": 1.4238046554928508e-05, "loss": 0.4295, "step": 6160 }, { "epoch": 1.14, "learning_rate": 1.4236237270937226e-05, "loss": 0.4324, "step": 6161 }, { "epoch": 1.14, "learning_rate": 1.4234427817927919e-05, "loss": 0.446, "step": 6162 }, { "epoch": 1.14, "learning_rate": 1.4232618195972783e-05, "loss": 0.4586, "step": 6163 }, { "epoch": 1.14, "learning_rate": 1.4230808405144013e-05, "loss": 0.4432, "step": 6164 }, { "epoch": 1.14, "learning_rate": 1.4228998445513826e-05, "loss": 0.438, "step": 6165 }, { "epoch": 1.14, "learning_rate": 1.4227188317154428e-05, "loss": 0.4468, "step": 6166 }, { "epoch": 1.14, "learning_rate": 1.4225378020138043e-05, "loss": 0.4284, "step": 6167 }, { "epoch": 1.14, "learning_rate": 1.4223567554536897e-05, "loss": 0.4424, "step": 6168 }, { "epoch": 1.14, "learning_rate": 1.4221756920423227e-05, "loss": 0.4421, "step": 6169 }, { "epoch": 1.14, "learning_rate": 1.4219946117869273e-05, "loss": 0.4454, "step": 6170 }, { "epoch": 1.14, "learning_rate": 1.4218135146947278e-05, "loss": 0.4355, "step": 6171 }, { "epoch": 1.14, "learning_rate": 1.4216324007729503e-05, "loss": 0.4384, "step": 6172 }, { "epoch": 1.14, "learning_rate": 1.4214512700288206e-05, "loss": 0.4352, "step": 6173 }, { "epoch": 1.14, "learning_rate": 1.4212701224695657e-05, "loss": 0.4348, "step": 6174 }, { "epoch": 1.14, "learning_rate": 1.4210889581024127e-05, "loss": 0.4423, "step": 6175 }, { "epoch": 1.14, "learning_rate": 1.4209077769345899e-05, "loss": 0.4361, "step": 6176 }, { "epoch": 1.14, "learning_rate": 1.420726578973326e-05, "loss": 0.4508, "step": 6177 }, { "epoch": 1.14, "learning_rate": 1.4205453642258507e-05, "loss": 0.46, "step": 6178 }, { "epoch": 1.14, "learning_rate": 1.420364132699394e-05, "loss": 0.435, "step": 6179 }, { "epoch": 1.14, "learning_rate": 1.4201828844011867e-05, "loss": 0.4502, "step": 6180 }, { "epoch": 1.14, "learning_rate": 1.4200016193384603e-05, "loss": 0.433, "step": 6181 }, { "epoch": 1.14, "learning_rate": 1.4198203375184468e-05, "loss": 0.4641, "step": 6182 }, { "epoch": 1.14, "learning_rate": 1.419639038948379e-05, "loss": 0.447, "step": 6183 }, { "epoch": 1.14, "learning_rate": 1.4194577236354908e-05, "loss": 0.4369, "step": 6184 }, { "epoch": 1.14, "learning_rate": 1.4192763915870157e-05, "loss": 0.445, "step": 6185 }, { "epoch": 1.14, "learning_rate": 1.419095042810189e-05, "loss": 0.425, "step": 6186 }, { "epoch": 1.14, "learning_rate": 1.4189136773122461e-05, "loss": 0.4536, "step": 6187 }, { "epoch": 1.14, "learning_rate": 1.418732295100423e-05, "loss": 0.4416, "step": 6188 }, { "epoch": 1.15, "learning_rate": 1.4185508961819566e-05, "loss": 0.4288, "step": 6189 }, { "epoch": 1.15, "learning_rate": 1.4183694805640842e-05, "loss": 0.4279, "step": 6190 }, { "epoch": 1.15, "learning_rate": 1.4181880482540444e-05, "loss": 0.4399, "step": 6191 }, { "epoch": 1.15, "learning_rate": 1.4180065992590754e-05, "loss": 0.434, "step": 6192 }, { "epoch": 1.15, "learning_rate": 1.4178251335864173e-05, "loss": 0.432, "step": 6193 }, { "epoch": 1.15, "learning_rate": 1.4176436512433099e-05, "loss": 0.4388, "step": 6194 }, { "epoch": 1.15, "learning_rate": 1.4174621522369937e-05, "loss": 0.4464, "step": 6195 }, { "epoch": 1.15, "learning_rate": 1.417280636574711e-05, "loss": 0.4255, "step": 6196 }, { "epoch": 1.15, "learning_rate": 1.4170991042637032e-05, "loss": 0.4202, "step": 6197 }, { "epoch": 1.15, "learning_rate": 1.4169175553112135e-05, "loss": 0.4273, "step": 6198 }, { "epoch": 1.15, "learning_rate": 1.4167359897244852e-05, "loss": 0.4504, "step": 6199 }, { "epoch": 1.15, "learning_rate": 1.4165544075107627e-05, "loss": 0.4648, "step": 6200 }, { "epoch": 1.15, "learning_rate": 1.41637280867729e-05, "loss": 0.4504, "step": 6201 }, { "epoch": 1.15, "learning_rate": 1.416191193231314e-05, "loss": 0.4333, "step": 6202 }, { "epoch": 1.15, "learning_rate": 1.4160095611800793e-05, "loss": 0.4636, "step": 6203 }, { "epoch": 1.15, "learning_rate": 1.4158279125308334e-05, "loss": 0.4514, "step": 6204 }, { "epoch": 1.15, "learning_rate": 1.4156462472908239e-05, "loss": 0.4316, "step": 6205 }, { "epoch": 1.15, "learning_rate": 1.4154645654672984e-05, "loss": 0.4365, "step": 6206 }, { "epoch": 1.15, "learning_rate": 1.4152828670675063e-05, "loss": 0.4718, "step": 6207 }, { "epoch": 1.15, "learning_rate": 1.4151011520986964e-05, "loss": 0.4484, "step": 6208 }, { "epoch": 1.15, "learning_rate": 1.414919420568119e-05, "loss": 0.4431, "step": 6209 }, { "epoch": 1.15, "learning_rate": 1.4147376724830252e-05, "loss": 0.4334, "step": 6210 }, { "epoch": 1.15, "learning_rate": 1.414555907850666e-05, "loss": 0.4455, "step": 6211 }, { "epoch": 1.15, "learning_rate": 1.4143741266782936e-05, "loss": 0.4519, "step": 6212 }, { "epoch": 1.15, "learning_rate": 1.414192328973161e-05, "loss": 0.4504, "step": 6213 }, { "epoch": 1.15, "learning_rate": 1.414010514742521e-05, "loss": 0.4367, "step": 6214 }, { "epoch": 1.15, "learning_rate": 1.413828683993628e-05, "loss": 0.4516, "step": 6215 }, { "epoch": 1.15, "learning_rate": 1.4136468367337366e-05, "loss": 0.4339, "step": 6216 }, { "epoch": 1.15, "learning_rate": 1.4134649729701024e-05, "loss": 0.4435, "step": 6217 }, { "epoch": 1.15, "learning_rate": 1.4132830927099816e-05, "loss": 0.434, "step": 6218 }, { "epoch": 1.15, "learning_rate": 1.4131011959606302e-05, "loss": 0.4442, "step": 6219 }, { "epoch": 1.15, "learning_rate": 1.412919282729306e-05, "loss": 0.436, "step": 6220 }, { "epoch": 1.15, "learning_rate": 1.4127373530232668e-05, "loss": 0.4213, "step": 6221 }, { "epoch": 1.15, "learning_rate": 1.4125554068497716e-05, "loss": 0.4022, "step": 6222 }, { "epoch": 1.15, "learning_rate": 1.4123734442160793e-05, "loss": 0.446, "step": 6223 }, { "epoch": 1.15, "learning_rate": 1.4121914651294502e-05, "loss": 0.4386, "step": 6224 }, { "epoch": 1.15, "learning_rate": 1.4120094695971447e-05, "loss": 0.4498, "step": 6225 }, { "epoch": 1.15, "learning_rate": 1.4118274576264241e-05, "loss": 0.4441, "step": 6226 }, { "epoch": 1.15, "learning_rate": 1.4116454292245505e-05, "loss": 0.4369, "step": 6227 }, { "epoch": 1.15, "learning_rate": 1.4114633843987864e-05, "loss": 0.444, "step": 6228 }, { "epoch": 1.15, "learning_rate": 1.4112813231563953e-05, "loss": 0.4423, "step": 6229 }, { "epoch": 1.15, "learning_rate": 1.4110992455046408e-05, "loss": 0.4398, "step": 6230 }, { "epoch": 1.15, "learning_rate": 1.4109171514507873e-05, "loss": 0.4453, "step": 6231 }, { "epoch": 1.15, "learning_rate": 1.4107350410021004e-05, "loss": 0.4392, "step": 6232 }, { "epoch": 1.15, "learning_rate": 1.4105529141658458e-05, "loss": 0.4337, "step": 6233 }, { "epoch": 1.15, "learning_rate": 1.4103707709492902e-05, "loss": 0.4409, "step": 6234 }, { "epoch": 1.15, "learning_rate": 1.4101886113597003e-05, "loss": 0.4411, "step": 6235 }, { "epoch": 1.15, "learning_rate": 1.4100064354043443e-05, "loss": 0.4431, "step": 6236 }, { "epoch": 1.15, "learning_rate": 1.409824243090491e-05, "loss": 0.4485, "step": 6237 }, { "epoch": 1.15, "learning_rate": 1.4096420344254087e-05, "loss": 0.4615, "step": 6238 }, { "epoch": 1.15, "learning_rate": 1.4094598094163679e-05, "loss": 0.4561, "step": 6239 }, { "epoch": 1.15, "learning_rate": 1.409277568070639e-05, "loss": 0.4413, "step": 6240 }, { "epoch": 1.15, "learning_rate": 1.4090953103954925e-05, "loss": 0.4586, "step": 6241 }, { "epoch": 1.15, "learning_rate": 1.4089130363982006e-05, "loss": 0.4464, "step": 6242 }, { "epoch": 1.16, "learning_rate": 1.408730746086036e-05, "loss": 0.4246, "step": 6243 }, { "epoch": 1.16, "learning_rate": 1.408548439466271e-05, "loss": 0.4505, "step": 6244 }, { "epoch": 1.16, "learning_rate": 1.4083661165461796e-05, "loss": 0.429, "step": 6245 }, { "epoch": 1.16, "learning_rate": 1.4081837773330365e-05, "loss": 0.4553, "step": 6246 }, { "epoch": 1.16, "learning_rate": 1.4080014218341162e-05, "loss": 0.462, "step": 6247 }, { "epoch": 1.16, "learning_rate": 1.4078190500566949e-05, "loss": 0.4446, "step": 6248 }, { "epoch": 1.16, "learning_rate": 1.4076366620080481e-05, "loss": 0.4295, "step": 6249 }, { "epoch": 1.16, "learning_rate": 1.4074542576954536e-05, "loss": 0.4686, "step": 6250 }, { "epoch": 1.16, "learning_rate": 1.4072718371261884e-05, "loss": 0.4416, "step": 6251 }, { "epoch": 1.16, "learning_rate": 1.407089400307531e-05, "loss": 0.4274, "step": 6252 }, { "epoch": 1.16, "learning_rate": 1.4069069472467603e-05, "loss": 0.4337, "step": 6253 }, { "epoch": 1.16, "learning_rate": 1.4067244779511555e-05, "loss": 0.4525, "step": 6254 }, { "epoch": 1.16, "learning_rate": 1.4065419924279973e-05, "loss": 0.4401, "step": 6255 }, { "epoch": 1.16, "learning_rate": 1.4063594906845663e-05, "loss": 0.426, "step": 6256 }, { "epoch": 1.16, "learning_rate": 1.406176972728144e-05, "loss": 0.4284, "step": 6257 }, { "epoch": 1.16, "learning_rate": 1.4059944385660124e-05, "loss": 0.4547, "step": 6258 }, { "epoch": 1.16, "learning_rate": 1.4058118882054544e-05, "loss": 0.4306, "step": 6259 }, { "epoch": 1.16, "learning_rate": 1.4056293216537533e-05, "loss": 0.4224, "step": 6260 }, { "epoch": 1.16, "learning_rate": 1.4054467389181934e-05, "loss": 0.4754, "step": 6261 }, { "epoch": 1.16, "learning_rate": 1.4052641400060594e-05, "loss": 0.4603, "step": 6262 }, { "epoch": 1.16, "learning_rate": 1.4050815249246364e-05, "loss": 0.4317, "step": 6263 }, { "epoch": 1.16, "learning_rate": 1.4048988936812105e-05, "loss": 0.4322, "step": 6264 }, { "epoch": 1.16, "learning_rate": 1.4047162462830684e-05, "loss": 0.4241, "step": 6265 }, { "epoch": 1.16, "learning_rate": 1.4045335827374973e-05, "loss": 0.4275, "step": 6266 }, { "epoch": 1.16, "learning_rate": 1.4043509030517857e-05, "loss": 0.4176, "step": 6267 }, { "epoch": 1.16, "learning_rate": 1.4041682072332213e-05, "loss": 0.4476, "step": 6268 }, { "epoch": 1.16, "learning_rate": 1.4039854952890937e-05, "loss": 0.448, "step": 6269 }, { "epoch": 1.16, "learning_rate": 1.4038027672266927e-05, "loss": 0.4256, "step": 6270 }, { "epoch": 1.16, "learning_rate": 1.4036200230533093e-05, "loss": 0.4329, "step": 6271 }, { "epoch": 1.16, "learning_rate": 1.403437262776234e-05, "loss": 0.4463, "step": 6272 }, { "epoch": 1.16, "learning_rate": 1.4032544864027588e-05, "loss": 0.4442, "step": 6273 }, { "epoch": 1.16, "learning_rate": 1.4030716939401763e-05, "loss": 0.4536, "step": 6274 }, { "epoch": 1.16, "learning_rate": 1.4028888853957793e-05, "loss": 0.4389, "step": 6275 }, { "epoch": 1.16, "learning_rate": 1.402706060776862e-05, "loss": 0.4274, "step": 6276 }, { "epoch": 1.16, "learning_rate": 1.4025232200907182e-05, "loss": 0.4439, "step": 6277 }, { "epoch": 1.16, "learning_rate": 1.4023403633446436e-05, "loss": 0.4361, "step": 6278 }, { "epoch": 1.16, "learning_rate": 1.4021574905459332e-05, "loss": 0.4542, "step": 6279 }, { "epoch": 1.16, "learning_rate": 1.4019746017018833e-05, "loss": 0.4649, "step": 6280 }, { "epoch": 1.16, "learning_rate": 1.401791696819791e-05, "loss": 0.4475, "step": 6281 }, { "epoch": 1.16, "learning_rate": 1.401608775906954e-05, "loss": 0.4329, "step": 6282 }, { "epoch": 1.16, "learning_rate": 1.4014258389706705e-05, "loss": 0.4429, "step": 6283 }, { "epoch": 1.16, "learning_rate": 1.4012428860182395e-05, "loss": 0.4415, "step": 6284 }, { "epoch": 1.16, "learning_rate": 1.40105991705696e-05, "loss": 0.4423, "step": 6285 }, { "epoch": 1.16, "learning_rate": 1.4008769320941323e-05, "loss": 0.4294, "step": 6286 }, { "epoch": 1.16, "learning_rate": 1.4006939311370571e-05, "loss": 0.4386, "step": 6287 }, { "epoch": 1.16, "learning_rate": 1.4005109141930359e-05, "loss": 0.4323, "step": 6288 }, { "epoch": 1.16, "learning_rate": 1.400327881269371e-05, "loss": 0.4515, "step": 6289 }, { "epoch": 1.16, "learning_rate": 1.4001448323733647e-05, "loss": 0.4385, "step": 6290 }, { "epoch": 1.16, "learning_rate": 1.3999617675123203e-05, "loss": 0.4346, "step": 6291 }, { "epoch": 1.16, "learning_rate": 1.3997786866935421e-05, "loss": 0.4374, "step": 6292 }, { "epoch": 1.16, "learning_rate": 1.3995955899243343e-05, "loss": 0.4687, "step": 6293 }, { "epoch": 1.16, "learning_rate": 1.3994124772120023e-05, "loss": 0.4308, "step": 6294 }, { "epoch": 1.16, "learning_rate": 1.3992293485638521e-05, "loss": 0.4616, "step": 6295 }, { "epoch": 1.16, "learning_rate": 1.39904620398719e-05, "loss": 0.4358, "step": 6296 }, { "epoch": 1.17, "learning_rate": 1.3988630434893231e-05, "loss": 0.4351, "step": 6297 }, { "epoch": 1.17, "learning_rate": 1.3986798670775592e-05, "loss": 0.4559, "step": 6298 }, { "epoch": 1.17, "learning_rate": 1.3984966747592068e-05, "loss": 0.438, "step": 6299 }, { "epoch": 1.17, "learning_rate": 1.3983134665415752e-05, "loss": 0.4383, "step": 6300 }, { "epoch": 1.17, "learning_rate": 1.3981302424319734e-05, "loss": 0.4464, "step": 6301 }, { "epoch": 1.17, "learning_rate": 1.397947002437712e-05, "loss": 0.4179, "step": 6302 }, { "epoch": 1.17, "learning_rate": 1.397763746566102e-05, "loss": 0.4552, "step": 6303 }, { "epoch": 1.17, "learning_rate": 1.397580474824455e-05, "loss": 0.4402, "step": 6304 }, { "epoch": 1.17, "learning_rate": 1.3973971872200831e-05, "loss": 0.418, "step": 6305 }, { "epoch": 1.17, "learning_rate": 1.3972138837602996e-05, "loss": 0.4669, "step": 6306 }, { "epoch": 1.17, "learning_rate": 1.397030564452417e-05, "loss": 0.4372, "step": 6307 }, { "epoch": 1.17, "learning_rate": 1.3968472293037503e-05, "loss": 0.45, "step": 6308 }, { "epoch": 1.17, "learning_rate": 1.3966638783216138e-05, "loss": 0.443, "step": 6309 }, { "epoch": 1.17, "learning_rate": 1.3964805115133229e-05, "loss": 0.4409, "step": 6310 }, { "epoch": 1.17, "learning_rate": 1.3962971288861937e-05, "loss": 0.439, "step": 6311 }, { "epoch": 1.17, "learning_rate": 1.3961137304475428e-05, "loss": 0.4324, "step": 6312 }, { "epoch": 1.17, "learning_rate": 1.3959303162046873e-05, "loss": 0.4441, "step": 6313 }, { "epoch": 1.17, "learning_rate": 1.3957468861649455e-05, "loss": 0.4397, "step": 6314 }, { "epoch": 1.17, "learning_rate": 1.3955634403356353e-05, "loss": 0.4354, "step": 6315 }, { "epoch": 1.17, "learning_rate": 1.3953799787240765e-05, "loss": 0.4288, "step": 6316 }, { "epoch": 1.17, "learning_rate": 1.3951965013375886e-05, "loss": 0.4498, "step": 6317 }, { "epoch": 1.17, "learning_rate": 1.3950130081834918e-05, "loss": 0.4335, "step": 6318 }, { "epoch": 1.17, "learning_rate": 1.3948294992691074e-05, "loss": 0.4557, "step": 6319 }, { "epoch": 1.17, "learning_rate": 1.3946459746017569e-05, "loss": 0.4373, "step": 6320 }, { "epoch": 1.17, "learning_rate": 1.3944624341887627e-05, "loss": 0.4503, "step": 6321 }, { "epoch": 1.17, "learning_rate": 1.3942788780374477e-05, "loss": 0.434, "step": 6322 }, { "epoch": 1.17, "learning_rate": 1.3940953061551354e-05, "loss": 0.4361, "step": 6323 }, { "epoch": 1.17, "learning_rate": 1.3939117185491503e-05, "loss": 0.4358, "step": 6324 }, { "epoch": 1.17, "learning_rate": 1.3937281152268168e-05, "loss": 0.455, "step": 6325 }, { "epoch": 1.17, "learning_rate": 1.3935444961954602e-05, "loss": 0.4376, "step": 6326 }, { "epoch": 1.17, "learning_rate": 1.3933608614624073e-05, "loss": 0.4505, "step": 6327 }, { "epoch": 1.17, "learning_rate": 1.3931772110349839e-05, "loss": 0.4537, "step": 6328 }, { "epoch": 1.17, "learning_rate": 1.3929935449205181e-05, "loss": 0.4376, "step": 6329 }, { "epoch": 1.17, "learning_rate": 1.3928098631263372e-05, "loss": 0.4595, "step": 6330 }, { "epoch": 1.17, "learning_rate": 1.3926261656597702e-05, "loss": 0.4253, "step": 6331 }, { "epoch": 1.17, "learning_rate": 1.3924424525281459e-05, "loss": 0.4181, "step": 6332 }, { "epoch": 1.17, "learning_rate": 1.3922587237387945e-05, "loss": 0.4303, "step": 6333 }, { "epoch": 1.17, "learning_rate": 1.3920749792990464e-05, "loss": 0.4386, "step": 6334 }, { "epoch": 1.17, "learning_rate": 1.3918912192162322e-05, "loss": 0.4592, "step": 6335 }, { "epoch": 1.17, "learning_rate": 1.3917074434976841e-05, "loss": 0.4523, "step": 6336 }, { "epoch": 1.17, "learning_rate": 1.3915236521507342e-05, "loss": 0.4328, "step": 6337 }, { "epoch": 1.17, "learning_rate": 1.3913398451827153e-05, "loss": 0.4436, "step": 6338 }, { "epoch": 1.17, "learning_rate": 1.3911560226009617e-05, "loss": 0.4555, "step": 6339 }, { "epoch": 1.17, "learning_rate": 1.3909721844128065e-05, "loss": 0.4596, "step": 6340 }, { "epoch": 1.17, "learning_rate": 1.3907883306255851e-05, "loss": 0.4412, "step": 6341 }, { "epoch": 1.17, "learning_rate": 1.3906044612466328e-05, "loss": 0.4547, "step": 6342 }, { "epoch": 1.17, "learning_rate": 1.3904205762832856e-05, "loss": 0.4163, "step": 6343 }, { "epoch": 1.17, "learning_rate": 1.3902366757428808e-05, "loss": 0.4353, "step": 6344 }, { "epoch": 1.17, "learning_rate": 1.3900527596327545e-05, "loss": 0.4576, "step": 6345 }, { "epoch": 1.17, "learning_rate": 1.3898688279602456e-05, "loss": 0.455, "step": 6346 }, { "epoch": 1.17, "learning_rate": 1.3896848807326921e-05, "loss": 0.4329, "step": 6347 }, { "epoch": 1.17, "learning_rate": 1.3895009179574332e-05, "loss": 0.4613, "step": 6348 }, { "epoch": 1.17, "learning_rate": 1.3893169396418092e-05, "loss": 0.4572, "step": 6349 }, { "epoch": 1.17, "learning_rate": 1.38913294579316e-05, "loss": 0.4446, "step": 6350 }, { "epoch": 1.18, "learning_rate": 1.3889489364188265e-05, "loss": 0.4354, "step": 6351 }, { "epoch": 1.18, "learning_rate": 1.3887649115261506e-05, "loss": 0.4506, "step": 6352 }, { "epoch": 1.18, "learning_rate": 1.3885808711224747e-05, "loss": 0.4478, "step": 6353 }, { "epoch": 1.18, "learning_rate": 1.3883968152151412e-05, "loss": 0.4605, "step": 6354 }, { "epoch": 1.18, "learning_rate": 1.3882127438114943e-05, "loss": 0.4218, "step": 6355 }, { "epoch": 1.18, "learning_rate": 1.3880286569188775e-05, "loss": 0.4426, "step": 6356 }, { "epoch": 1.18, "learning_rate": 1.3878445545446355e-05, "loss": 0.4361, "step": 6357 }, { "epoch": 1.18, "learning_rate": 1.3876604366961139e-05, "loss": 0.4338, "step": 6358 }, { "epoch": 1.18, "learning_rate": 1.387476303380659e-05, "loss": 0.4625, "step": 6359 }, { "epoch": 1.18, "learning_rate": 1.3872921546056164e-05, "loss": 0.4564, "step": 6360 }, { "epoch": 1.18, "learning_rate": 1.3871079903783344e-05, "loss": 0.434, "step": 6361 }, { "epoch": 1.18, "learning_rate": 1.38692381070616e-05, "loss": 0.4296, "step": 6362 }, { "epoch": 1.18, "learning_rate": 1.3867396155964422e-05, "loss": 0.4496, "step": 6363 }, { "epoch": 1.18, "learning_rate": 1.3865554050565293e-05, "loss": 0.4349, "step": 6364 }, { "epoch": 1.18, "learning_rate": 1.3863711790937717e-05, "loss": 0.4261, "step": 6365 }, { "epoch": 1.18, "learning_rate": 1.3861869377155196e-05, "loss": 0.4534, "step": 6366 }, { "epoch": 1.18, "learning_rate": 1.3860026809291237e-05, "loss": 0.4675, "step": 6367 }, { "epoch": 1.18, "learning_rate": 1.385818408741935e-05, "loss": 0.4454, "step": 6368 }, { "epoch": 1.18, "learning_rate": 1.3856341211613064e-05, "loss": 0.4442, "step": 6369 }, { "epoch": 1.18, "learning_rate": 1.3854498181945903e-05, "loss": 0.4485, "step": 6370 }, { "epoch": 1.18, "learning_rate": 1.3852654998491401e-05, "loss": 0.4447, "step": 6371 }, { "epoch": 1.18, "learning_rate": 1.3850811661323098e-05, "loss": 0.4244, "step": 6372 }, { "epoch": 1.18, "learning_rate": 1.384896817051454e-05, "loss": 0.4285, "step": 6373 }, { "epoch": 1.18, "learning_rate": 1.3847124526139278e-05, "loss": 0.4378, "step": 6374 }, { "epoch": 1.18, "learning_rate": 1.3845280728270867e-05, "loss": 0.4677, "step": 6375 }, { "epoch": 1.18, "learning_rate": 1.3843436776982877e-05, "loss": 0.4508, "step": 6376 }, { "epoch": 1.18, "learning_rate": 1.3841592672348878e-05, "loss": 0.4279, "step": 6377 }, { "epoch": 1.18, "learning_rate": 1.383974841444244e-05, "loss": 0.4291, "step": 6378 }, { "epoch": 1.18, "learning_rate": 1.383790400333715e-05, "loss": 0.452, "step": 6379 }, { "epoch": 1.18, "learning_rate": 1.3836059439106597e-05, "loss": 0.4229, "step": 6380 }, { "epoch": 1.18, "learning_rate": 1.3834214721824375e-05, "loss": 0.4451, "step": 6381 }, { "epoch": 1.18, "learning_rate": 1.3832369851564082e-05, "loss": 0.4545, "step": 6382 }, { "epoch": 1.18, "learning_rate": 1.3830524828399332e-05, "loss": 0.4399, "step": 6383 }, { "epoch": 1.18, "learning_rate": 1.3828679652403732e-05, "loss": 0.4478, "step": 6384 }, { "epoch": 1.18, "learning_rate": 1.3826834323650899e-05, "loss": 0.4297, "step": 6385 }, { "epoch": 1.18, "learning_rate": 1.3824988842214464e-05, "loss": 0.4449, "step": 6386 }, { "epoch": 1.18, "learning_rate": 1.3823143208168055e-05, "loss": 0.424, "step": 6387 }, { "epoch": 1.18, "learning_rate": 1.3821297421585314e-05, "loss": 0.4173, "step": 6388 }, { "epoch": 1.18, "learning_rate": 1.3819451482539875e-05, "loss": 0.4442, "step": 6389 }, { "epoch": 1.18, "learning_rate": 1.3817605391105398e-05, "loss": 0.4318, "step": 6390 }, { "epoch": 1.18, "learning_rate": 1.3815759147355532e-05, "loss": 0.4552, "step": 6391 }, { "epoch": 1.18, "learning_rate": 1.381391275136394e-05, "loss": 0.4296, "step": 6392 }, { "epoch": 1.18, "learning_rate": 1.3812066203204291e-05, "loss": 0.4465, "step": 6393 }, { "epoch": 1.18, "learning_rate": 1.381021950295026e-05, "loss": 0.4366, "step": 6394 }, { "epoch": 1.18, "learning_rate": 1.3808372650675526e-05, "loss": 0.4375, "step": 6395 }, { "epoch": 1.18, "learning_rate": 1.380652564645377e-05, "loss": 0.4372, "step": 6396 }, { "epoch": 1.18, "learning_rate": 1.3804678490358691e-05, "loss": 0.4647, "step": 6397 }, { "epoch": 1.18, "learning_rate": 1.3802831182463983e-05, "loss": 0.4168, "step": 6398 }, { "epoch": 1.18, "learning_rate": 1.3800983722843352e-05, "loss": 0.4227, "step": 6399 }, { "epoch": 1.18, "learning_rate": 1.3799136111570509e-05, "loss": 0.4559, "step": 6400 }, { "epoch": 1.18, "learning_rate": 1.3797288348719166e-05, "loss": 0.46, "step": 6401 }, { "epoch": 1.18, "learning_rate": 1.3795440434363052e-05, "loss": 0.444, "step": 6402 }, { "epoch": 1.18, "learning_rate": 1.379359236857589e-05, "loss": 0.4388, "step": 6403 }, { "epoch": 1.18, "learning_rate": 1.3791744151431416e-05, "loss": 0.4218, "step": 6404 }, { "epoch": 1.19, "learning_rate": 1.3789895783003373e-05, "loss": 0.4131, "step": 6405 }, { "epoch": 1.19, "learning_rate": 1.3788047263365502e-05, "loss": 0.4415, "step": 6406 }, { "epoch": 1.19, "learning_rate": 1.3786198592591561e-05, "loss": 0.4617, "step": 6407 }, { "epoch": 1.19, "learning_rate": 1.3784349770755305e-05, "loss": 0.4355, "step": 6408 }, { "epoch": 1.19, "learning_rate": 1.37825007979305e-05, "loss": 0.445, "step": 6409 }, { "epoch": 1.19, "learning_rate": 1.3780651674190917e-05, "loss": 0.4259, "step": 6410 }, { "epoch": 1.19, "learning_rate": 1.3778802399610332e-05, "loss": 0.4361, "step": 6411 }, { "epoch": 1.19, "learning_rate": 1.3776952974262525e-05, "loss": 0.4324, "step": 6412 }, { "epoch": 1.19, "learning_rate": 1.3775103398221288e-05, "loss": 0.4287, "step": 6413 }, { "epoch": 1.19, "learning_rate": 1.3773253671560417e-05, "loss": 0.4626, "step": 6414 }, { "epoch": 1.19, "learning_rate": 1.3771403794353707e-05, "loss": 0.4505, "step": 6415 }, { "epoch": 1.19, "learning_rate": 1.3769553766674973e-05, "loss": 0.4398, "step": 6416 }, { "epoch": 1.19, "learning_rate": 1.3767703588598018e-05, "loss": 0.416, "step": 6417 }, { "epoch": 1.19, "learning_rate": 1.376585326019667e-05, "loss": 0.429, "step": 6418 }, { "epoch": 1.19, "learning_rate": 1.3764002781544745e-05, "loss": 0.4556, "step": 6419 }, { "epoch": 1.19, "learning_rate": 1.376215215271608e-05, "loss": 0.4573, "step": 6420 }, { "epoch": 1.19, "learning_rate": 1.3760301373784507e-05, "loss": 0.4369, "step": 6421 }, { "epoch": 1.19, "learning_rate": 1.3758450444823872e-05, "loss": 0.4196, "step": 6422 }, { "epoch": 1.19, "learning_rate": 1.3756599365908025e-05, "loss": 0.4312, "step": 6423 }, { "epoch": 1.19, "learning_rate": 1.3754748137110818e-05, "loss": 0.4275, "step": 6424 }, { "epoch": 1.19, "learning_rate": 1.3752896758506111e-05, "loss": 0.4217, "step": 6425 }, { "epoch": 1.19, "learning_rate": 1.3751045230167772e-05, "loss": 0.4304, "step": 6426 }, { "epoch": 1.19, "learning_rate": 1.3749193552169675e-05, "loss": 0.4473, "step": 6427 }, { "epoch": 1.19, "learning_rate": 1.3747341724585695e-05, "loss": 0.4679, "step": 6428 }, { "epoch": 1.19, "learning_rate": 1.3745489747489717e-05, "loss": 0.4296, "step": 6429 }, { "epoch": 1.19, "learning_rate": 1.3743637620955635e-05, "loss": 0.4559, "step": 6430 }, { "epoch": 1.19, "learning_rate": 1.3741785345057342e-05, "loss": 0.4466, "step": 6431 }, { "epoch": 1.19, "learning_rate": 1.3739932919868744e-05, "loss": 0.444, "step": 6432 }, { "epoch": 1.19, "learning_rate": 1.3738080345463743e-05, "loss": 0.4399, "step": 6433 }, { "epoch": 1.19, "learning_rate": 1.3736227621916258e-05, "loss": 0.4553, "step": 6434 }, { "epoch": 1.19, "learning_rate": 1.3734374749300208e-05, "loss": 0.449, "step": 6435 }, { "epoch": 1.19, "learning_rate": 1.373252172768952e-05, "loss": 0.429, "step": 6436 }, { "epoch": 1.19, "learning_rate": 1.3730668557158127e-05, "loss": 0.4429, "step": 6437 }, { "epoch": 1.19, "learning_rate": 1.3728815237779967e-05, "loss": 0.4554, "step": 6438 }, { "epoch": 1.19, "learning_rate": 1.3726961769628978e-05, "loss": 0.447, "step": 6439 }, { "epoch": 1.19, "learning_rate": 1.3725108152779118e-05, "loss": 0.442, "step": 6440 }, { "epoch": 1.19, "learning_rate": 1.3723254387304338e-05, "loss": 0.4412, "step": 6441 }, { "epoch": 1.19, "learning_rate": 1.3721400473278603e-05, "loss": 0.4467, "step": 6442 }, { "epoch": 1.19, "learning_rate": 1.3719546410775879e-05, "loss": 0.447, "step": 6443 }, { "epoch": 1.19, "learning_rate": 1.3717692199870138e-05, "loss": 0.4343, "step": 6444 }, { "epoch": 1.19, "learning_rate": 1.3715837840635363e-05, "loss": 0.4473, "step": 6445 }, { "epoch": 1.19, "learning_rate": 1.3713983333145535e-05, "loss": 0.4346, "step": 6446 }, { "epoch": 1.19, "learning_rate": 1.3712128677474653e-05, "loss": 0.4414, "step": 6447 }, { "epoch": 1.19, "learning_rate": 1.3710273873696705e-05, "loss": 0.4416, "step": 6448 }, { "epoch": 1.19, "learning_rate": 1.37084189218857e-05, "loss": 0.43, "step": 6449 }, { "epoch": 1.19, "learning_rate": 1.3706563822115646e-05, "loss": 0.4475, "step": 6450 }, { "epoch": 1.19, "learning_rate": 1.3704708574460558e-05, "loss": 0.4392, "step": 6451 }, { "epoch": 1.19, "learning_rate": 1.3702853178994459e-05, "loss": 0.4346, "step": 6452 }, { "epoch": 1.19, "learning_rate": 1.3700997635791372e-05, "loss": 0.4449, "step": 6453 }, { "epoch": 1.19, "learning_rate": 1.3699141944925334e-05, "loss": 0.4482, "step": 6454 }, { "epoch": 1.19, "learning_rate": 1.3697286106470378e-05, "loss": 0.4547, "step": 6455 }, { "epoch": 1.19, "learning_rate": 1.3695430120500555e-05, "loss": 0.4503, "step": 6456 }, { "epoch": 1.19, "learning_rate": 1.3693573987089908e-05, "loss": 0.4397, "step": 6457 }, { "epoch": 1.19, "learning_rate": 1.36917177063125e-05, "loss": 0.4344, "step": 6458 }, { "epoch": 1.2, "learning_rate": 1.3689861278242389e-05, "loss": 0.4413, "step": 6459 }, { "epoch": 1.2, "learning_rate": 1.3688004702953649e-05, "loss": 0.4386, "step": 6460 }, { "epoch": 1.2, "learning_rate": 1.3686147980520343e-05, "loss": 0.4532, "step": 6461 }, { "epoch": 1.2, "learning_rate": 1.368429111101656e-05, "loss": 0.4301, "step": 6462 }, { "epoch": 1.2, "learning_rate": 1.3682434094516386e-05, "loss": 0.4205, "step": 6463 }, { "epoch": 1.2, "learning_rate": 1.3680576931093905e-05, "loss": 0.4426, "step": 6464 }, { "epoch": 1.2, "learning_rate": 1.3678719620823222e-05, "loss": 0.4405, "step": 6465 }, { "epoch": 1.2, "learning_rate": 1.3676862163778437e-05, "loss": 0.4485, "step": 6466 }, { "epoch": 1.2, "learning_rate": 1.3675004560033656e-05, "loss": 0.4418, "step": 6467 }, { "epoch": 1.2, "learning_rate": 1.3673146809662998e-05, "loss": 0.442, "step": 6468 }, { "epoch": 1.2, "learning_rate": 1.3671288912740586e-05, "loss": 0.4342, "step": 6469 }, { "epoch": 1.2, "learning_rate": 1.3669430869340541e-05, "loss": 0.4456, "step": 6470 }, { "epoch": 1.2, "learning_rate": 1.3667572679537e-05, "loss": 0.4449, "step": 6471 }, { "epoch": 1.2, "learning_rate": 1.3665714343404098e-05, "loss": 0.4378, "step": 6472 }, { "epoch": 1.2, "learning_rate": 1.366385586101598e-05, "loss": 0.4324, "step": 6473 }, { "epoch": 1.2, "learning_rate": 1.3661997232446797e-05, "loss": 0.4313, "step": 6474 }, { "epoch": 1.2, "learning_rate": 1.3660138457770703e-05, "loss": 0.4191, "step": 6475 }, { "epoch": 1.2, "learning_rate": 1.3658279537061866e-05, "loss": 0.4436, "step": 6476 }, { "epoch": 1.2, "learning_rate": 1.3656420470394443e-05, "loss": 0.44, "step": 6477 }, { "epoch": 1.2, "learning_rate": 1.3654561257842616e-05, "loss": 0.4507, "step": 6478 }, { "epoch": 1.2, "learning_rate": 1.365270189948056e-05, "loss": 0.4559, "step": 6479 }, { "epoch": 1.2, "learning_rate": 1.3650842395382462e-05, "loss": 0.4335, "step": 6480 }, { "epoch": 1.2, "learning_rate": 1.364898274562251e-05, "loss": 0.4539, "step": 6481 }, { "epoch": 1.2, "learning_rate": 1.3647122950274905e-05, "loss": 0.4488, "step": 6482 }, { "epoch": 1.2, "learning_rate": 1.3645263009413845e-05, "loss": 0.4422, "step": 6483 }, { "epoch": 1.2, "learning_rate": 1.364340292311354e-05, "loss": 0.4497, "step": 6484 }, { "epoch": 1.2, "learning_rate": 1.3641542691448204e-05, "loss": 0.4128, "step": 6485 }, { "epoch": 1.2, "learning_rate": 1.3639682314492058e-05, "loss": 0.4564, "step": 6486 }, { "epoch": 1.2, "learning_rate": 1.3637821792319326e-05, "loss": 0.4374, "step": 6487 }, { "epoch": 1.2, "learning_rate": 1.363596112500424e-05, "loss": 0.47, "step": 6488 }, { "epoch": 1.2, "learning_rate": 1.3634100312621035e-05, "loss": 0.4587, "step": 6489 }, { "epoch": 1.2, "learning_rate": 1.3632239355243958e-05, "loss": 0.4172, "step": 6490 }, { "epoch": 1.2, "learning_rate": 1.3630378252947252e-05, "loss": 0.4441, "step": 6491 }, { "epoch": 1.2, "learning_rate": 1.3628517005805177e-05, "loss": 0.4262, "step": 6492 }, { "epoch": 1.2, "learning_rate": 1.3626655613891995e-05, "loss": 0.4458, "step": 6493 }, { "epoch": 1.2, "learning_rate": 1.3624794077281967e-05, "loss": 0.4241, "step": 6494 }, { "epoch": 1.2, "learning_rate": 1.3622932396049362e-05, "loss": 0.4454, "step": 6495 }, { "epoch": 1.2, "learning_rate": 1.3621070570268466e-05, "loss": 0.4464, "step": 6496 }, { "epoch": 1.2, "learning_rate": 1.3619208600013557e-05, "loss": 0.4426, "step": 6497 }, { "epoch": 1.2, "learning_rate": 1.3617346485358927e-05, "loss": 0.4253, "step": 6498 }, { "epoch": 1.2, "learning_rate": 1.3615484226378867e-05, "loss": 0.4617, "step": 6499 }, { "epoch": 1.2, "learning_rate": 1.3613621823147682e-05, "loss": 0.4526, "step": 6500 }, { "epoch": 1.2, "learning_rate": 1.3611759275739677e-05, "loss": 0.4621, "step": 6501 }, { "epoch": 1.2, "learning_rate": 1.3609896584229163e-05, "loss": 0.4475, "step": 6502 }, { "epoch": 1.2, "learning_rate": 1.3608033748690461e-05, "loss": 0.4425, "step": 6503 }, { "epoch": 1.2, "learning_rate": 1.3606170769197894e-05, "loss": 0.4571, "step": 6504 }, { "epoch": 1.2, "learning_rate": 1.3604307645825785e-05, "loss": 0.4587, "step": 6505 }, { "epoch": 1.2, "learning_rate": 1.3602444378648477e-05, "loss": 0.4499, "step": 6506 }, { "epoch": 1.2, "learning_rate": 1.3600580967740306e-05, "loss": 0.4316, "step": 6507 }, { "epoch": 1.2, "learning_rate": 1.3598717413175622e-05, "loss": 0.4526, "step": 6508 }, { "epoch": 1.2, "learning_rate": 1.3596853715028776e-05, "loss": 0.451, "step": 6509 }, { "epoch": 1.2, "learning_rate": 1.3594989873374126e-05, "loss": 0.4583, "step": 6510 }, { "epoch": 1.2, "learning_rate": 1.3593125888286039e-05, "loss": 0.453, "step": 6511 }, { "epoch": 1.2, "learning_rate": 1.3591261759838879e-05, "loss": 0.4549, "step": 6512 }, { "epoch": 1.2, "learning_rate": 1.3589397488107021e-05, "loss": 0.4279, "step": 6513 }, { "epoch": 1.21, "learning_rate": 1.3587533073164851e-05, "loss": 0.4518, "step": 6514 }, { "epoch": 1.21, "learning_rate": 1.3585668515086756e-05, "loss": 0.4588, "step": 6515 }, { "epoch": 1.21, "learning_rate": 1.3583803813947122e-05, "loss": 0.43, "step": 6516 }, { "epoch": 1.21, "learning_rate": 1.3581938969820355e-05, "loss": 0.437, "step": 6517 }, { "epoch": 1.21, "learning_rate": 1.3580073982780853e-05, "loss": 0.4322, "step": 6518 }, { "epoch": 1.21, "learning_rate": 1.3578208852903025e-05, "loss": 0.4481, "step": 6519 }, { "epoch": 1.21, "learning_rate": 1.3576343580261293e-05, "loss": 0.4286, "step": 6520 }, { "epoch": 1.21, "learning_rate": 1.3574478164930071e-05, "loss": 0.4333, "step": 6521 }, { "epoch": 1.21, "learning_rate": 1.3572612606983789e-05, "loss": 0.4373, "step": 6522 }, { "epoch": 1.21, "learning_rate": 1.3570746906496877e-05, "loss": 0.4341, "step": 6523 }, { "epoch": 1.21, "learning_rate": 1.3568881063543776e-05, "loss": 0.4427, "step": 6524 }, { "epoch": 1.21, "learning_rate": 1.3567015078198929e-05, "loss": 0.4524, "step": 6525 }, { "epoch": 1.21, "learning_rate": 1.3565148950536782e-05, "loss": 0.4489, "step": 6526 }, { "epoch": 1.21, "learning_rate": 1.3563282680631793e-05, "loss": 0.444, "step": 6527 }, { "epoch": 1.21, "learning_rate": 1.3561416268558422e-05, "loss": 0.4354, "step": 6528 }, { "epoch": 1.21, "learning_rate": 1.3559549714391139e-05, "loss": 0.4342, "step": 6529 }, { "epoch": 1.21, "learning_rate": 1.3557683018204408e-05, "loss": 0.4252, "step": 6530 }, { "epoch": 1.21, "learning_rate": 1.3555816180072717e-05, "loss": 0.4459, "step": 6531 }, { "epoch": 1.21, "learning_rate": 1.3553949200070539e-05, "loss": 0.4452, "step": 6532 }, { "epoch": 1.21, "learning_rate": 1.3552082078272371e-05, "loss": 0.4463, "step": 6533 }, { "epoch": 1.21, "learning_rate": 1.3550214814752702e-05, "loss": 0.405, "step": 6534 }, { "epoch": 1.21, "learning_rate": 1.3548347409586038e-05, "loss": 0.4509, "step": 6535 }, { "epoch": 1.21, "learning_rate": 1.354647986284688e-05, "loss": 0.4448, "step": 6536 }, { "epoch": 1.21, "learning_rate": 1.3544612174609744e-05, "loss": 0.4325, "step": 6537 }, { "epoch": 1.21, "learning_rate": 1.3542744344949142e-05, "loss": 0.4493, "step": 6538 }, { "epoch": 1.21, "learning_rate": 1.35408763739396e-05, "loss": 0.4443, "step": 6539 }, { "epoch": 1.21, "learning_rate": 1.3539008261655646e-05, "loss": 0.4317, "step": 6540 }, { "epoch": 1.21, "learning_rate": 1.3537140008171817e-05, "loss": 0.4563, "step": 6541 }, { "epoch": 1.21, "learning_rate": 1.353527161356265e-05, "loss": 0.4464, "step": 6542 }, { "epoch": 1.21, "learning_rate": 1.3533403077902689e-05, "loss": 0.4339, "step": 6543 }, { "epoch": 1.21, "learning_rate": 1.3531534401266489e-05, "loss": 0.4452, "step": 6544 }, { "epoch": 1.21, "learning_rate": 1.3529665583728605e-05, "loss": 0.4266, "step": 6545 }, { "epoch": 1.21, "learning_rate": 1.3527796625363597e-05, "loss": 0.444, "step": 6546 }, { "epoch": 1.21, "learning_rate": 1.3525927526246036e-05, "loss": 0.476, "step": 6547 }, { "epoch": 1.21, "learning_rate": 1.3524058286450495e-05, "loss": 0.4545, "step": 6548 }, { "epoch": 1.21, "learning_rate": 1.3522188906051551e-05, "loss": 0.4324, "step": 6549 }, { "epoch": 1.21, "learning_rate": 1.3520319385123794e-05, "loss": 0.4244, "step": 6550 }, { "epoch": 1.21, "learning_rate": 1.3518449723741811e-05, "loss": 0.4143, "step": 6551 }, { "epoch": 1.21, "learning_rate": 1.3516579921980197e-05, "loss": 0.4449, "step": 6552 }, { "epoch": 1.21, "learning_rate": 1.3514709979913556e-05, "loss": 0.4075, "step": 6553 }, { "epoch": 1.21, "learning_rate": 1.3512839897616495e-05, "loss": 0.4448, "step": 6554 }, { "epoch": 1.21, "learning_rate": 1.3510969675163623e-05, "loss": 0.4446, "step": 6555 }, { "epoch": 1.21, "learning_rate": 1.3509099312629564e-05, "loss": 0.4589, "step": 6556 }, { "epoch": 1.21, "learning_rate": 1.3507228810088938e-05, "loss": 0.4318, "step": 6557 }, { "epoch": 1.21, "learning_rate": 1.3505358167616378e-05, "loss": 0.4251, "step": 6558 }, { "epoch": 1.21, "learning_rate": 1.3503487385286514e-05, "loss": 0.4404, "step": 6559 }, { "epoch": 1.21, "learning_rate": 1.3501616463173992e-05, "loss": 0.4445, "step": 6560 }, { "epoch": 1.21, "learning_rate": 1.3499745401353455e-05, "loss": 0.4545, "step": 6561 }, { "epoch": 1.21, "learning_rate": 1.3497874199899554e-05, "loss": 0.4248, "step": 6562 }, { "epoch": 1.21, "learning_rate": 1.3496002858886951e-05, "loss": 0.4355, "step": 6563 }, { "epoch": 1.21, "learning_rate": 1.3494131378390309e-05, "loss": 0.4201, "step": 6564 }, { "epoch": 1.21, "learning_rate": 1.3492259758484291e-05, "loss": 0.4577, "step": 6565 }, { "epoch": 1.21, "learning_rate": 1.3490387999243577e-05, "loss": 0.4354, "step": 6566 }, { "epoch": 1.21, "learning_rate": 1.3488516100742841e-05, "loss": 0.4422, "step": 6567 }, { "epoch": 1.22, "learning_rate": 1.3486644063056772e-05, "loss": 0.4493, "step": 6568 }, { "epoch": 1.22, "learning_rate": 1.3484771886260064e-05, "loss": 0.4401, "step": 6569 }, { "epoch": 1.22, "learning_rate": 1.3482899570427406e-05, "loss": 0.4416, "step": 6570 }, { "epoch": 1.22, "learning_rate": 1.3481027115633503e-05, "loss": 0.4374, "step": 6571 }, { "epoch": 1.22, "learning_rate": 1.3479154521953065e-05, "loss": 0.4479, "step": 6572 }, { "epoch": 1.22, "learning_rate": 1.34772817894608e-05, "loss": 0.4506, "step": 6573 }, { "epoch": 1.22, "learning_rate": 1.3475408918231432e-05, "loss": 0.4445, "step": 6574 }, { "epoch": 1.22, "learning_rate": 1.3473535908339684e-05, "loss": 0.4405, "step": 6575 }, { "epoch": 1.22, "learning_rate": 1.347166275986028e-05, "loss": 0.4372, "step": 6576 }, { "epoch": 1.22, "learning_rate": 1.3469789472867962e-05, "loss": 0.4652, "step": 6577 }, { "epoch": 1.22, "learning_rate": 1.3467916047437471e-05, "loss": 0.4079, "step": 6578 }, { "epoch": 1.22, "learning_rate": 1.3466042483643547e-05, "loss": 0.4686, "step": 6579 }, { "epoch": 1.22, "learning_rate": 1.3464168781560947e-05, "loss": 0.4338, "step": 6580 }, { "epoch": 1.22, "learning_rate": 1.3462294941264426e-05, "loss": 0.4415, "step": 6581 }, { "epoch": 1.22, "learning_rate": 1.3460420962828747e-05, "loss": 0.4479, "step": 6582 }, { "epoch": 1.22, "learning_rate": 1.3458546846328676e-05, "loss": 0.4437, "step": 6583 }, { "epoch": 1.22, "learning_rate": 1.345667259183899e-05, "loss": 0.4457, "step": 6584 }, { "epoch": 1.22, "learning_rate": 1.345479819943447e-05, "loss": 0.4281, "step": 6585 }, { "epoch": 1.22, "learning_rate": 1.3452923669189897e-05, "loss": 0.4356, "step": 6586 }, { "epoch": 1.22, "learning_rate": 1.3451049001180064e-05, "loss": 0.4425, "step": 6587 }, { "epoch": 1.22, "learning_rate": 1.3449174195479762e-05, "loss": 0.4532, "step": 6588 }, { "epoch": 1.22, "learning_rate": 1.3447299252163797e-05, "loss": 0.4346, "step": 6589 }, { "epoch": 1.22, "learning_rate": 1.3445424171306973e-05, "loss": 0.4369, "step": 6590 }, { "epoch": 1.22, "learning_rate": 1.3443548952984106e-05, "loss": 0.4282, "step": 6591 }, { "epoch": 1.22, "learning_rate": 1.3441673597270012e-05, "loss": 0.4691, "step": 6592 }, { "epoch": 1.22, "learning_rate": 1.3439798104239512e-05, "loss": 0.4507, "step": 6593 }, { "epoch": 1.22, "learning_rate": 1.3437922473967436e-05, "loss": 0.4383, "step": 6594 }, { "epoch": 1.22, "learning_rate": 1.3436046706528618e-05, "loss": 0.4486, "step": 6595 }, { "epoch": 1.22, "learning_rate": 1.3434170801997898e-05, "loss": 0.445, "step": 6596 }, { "epoch": 1.22, "learning_rate": 1.3432294760450124e-05, "loss": 0.435, "step": 6597 }, { "epoch": 1.22, "learning_rate": 1.3430418581960141e-05, "loss": 0.439, "step": 6598 }, { "epoch": 1.22, "learning_rate": 1.3428542266602809e-05, "loss": 0.4657, "step": 6599 }, { "epoch": 1.22, "learning_rate": 1.3426665814452986e-05, "loss": 0.4552, "step": 6600 }, { "epoch": 1.22, "learning_rate": 1.3424789225585544e-05, "loss": 0.4455, "step": 6601 }, { "epoch": 1.22, "learning_rate": 1.3422912500075351e-05, "loss": 0.4347, "step": 6602 }, { "epoch": 1.22, "learning_rate": 1.3421035637997288e-05, "loss": 0.4321, "step": 6603 }, { "epoch": 1.22, "learning_rate": 1.3419158639426234e-05, "loss": 0.4387, "step": 6604 }, { "epoch": 1.22, "learning_rate": 1.3417281504437086e-05, "loss": 0.4465, "step": 6605 }, { "epoch": 1.22, "learning_rate": 1.3415404233104727e-05, "loss": 0.4384, "step": 6606 }, { "epoch": 1.22, "learning_rate": 1.3413526825504066e-05, "loss": 0.4448, "step": 6607 }, { "epoch": 1.22, "learning_rate": 1.3411649281710007e-05, "loss": 0.4496, "step": 6608 }, { "epoch": 1.22, "learning_rate": 1.3409771601797455e-05, "loss": 0.4245, "step": 6609 }, { "epoch": 1.22, "learning_rate": 1.340789378584133e-05, "loss": 0.4368, "step": 6610 }, { "epoch": 1.22, "learning_rate": 1.340601583391655e-05, "loss": 0.4404, "step": 6611 }, { "epoch": 1.22, "learning_rate": 1.3404137746098047e-05, "loss": 0.4225, "step": 6612 }, { "epoch": 1.22, "learning_rate": 1.3402259522460752e-05, "loss": 0.4225, "step": 6613 }, { "epoch": 1.22, "learning_rate": 1.3400381163079598e-05, "loss": 0.4362, "step": 6614 }, { "epoch": 1.22, "learning_rate": 1.3398502668029531e-05, "loss": 0.4218, "step": 6615 }, { "epoch": 1.22, "learning_rate": 1.3396624037385502e-05, "loss": 0.4408, "step": 6616 }, { "epoch": 1.22, "learning_rate": 1.339474527122246e-05, "loss": 0.442, "step": 6617 }, { "epoch": 1.22, "learning_rate": 1.339286636961537e-05, "loss": 0.4384, "step": 6618 }, { "epoch": 1.22, "learning_rate": 1.3390987332639193e-05, "loss": 0.4525, "step": 6619 }, { "epoch": 1.22, "learning_rate": 1.3389108160368897e-05, "loss": 0.442, "step": 6620 }, { "epoch": 1.22, "learning_rate": 1.3387228852879463e-05, "loss": 0.4423, "step": 6621 }, { "epoch": 1.23, "learning_rate": 1.3385349410245867e-05, "loss": 0.4635, "step": 6622 }, { "epoch": 1.23, "learning_rate": 1.3383469832543099e-05, "loss": 0.4468, "step": 6623 }, { "epoch": 1.23, "learning_rate": 1.3381590119846148e-05, "loss": 0.4554, "step": 6624 }, { "epoch": 1.23, "learning_rate": 1.3379710272230012e-05, "loss": 0.4473, "step": 6625 }, { "epoch": 1.23, "learning_rate": 1.3377830289769693e-05, "loss": 0.4157, "step": 6626 }, { "epoch": 1.23, "learning_rate": 1.33759501725402e-05, "loss": 0.4429, "step": 6627 }, { "epoch": 1.23, "learning_rate": 1.3374069920616544e-05, "loss": 0.4075, "step": 6628 }, { "epoch": 1.23, "learning_rate": 1.3372189534073747e-05, "loss": 0.4473, "step": 6629 }, { "epoch": 1.23, "learning_rate": 1.3370309012986832e-05, "loss": 0.4531, "step": 6630 }, { "epoch": 1.23, "learning_rate": 1.3368428357430826e-05, "loss": 0.4385, "step": 6631 }, { "epoch": 1.23, "learning_rate": 1.3366547567480765e-05, "loss": 0.436, "step": 6632 }, { "epoch": 1.23, "learning_rate": 1.336466664321169e-05, "loss": 0.4291, "step": 6633 }, { "epoch": 1.23, "learning_rate": 1.3362785584698643e-05, "loss": 0.4718, "step": 6634 }, { "epoch": 1.23, "learning_rate": 1.336090439201668e-05, "loss": 0.4456, "step": 6635 }, { "epoch": 1.23, "learning_rate": 1.3359023065240854e-05, "loss": 0.449, "step": 6636 }, { "epoch": 1.23, "learning_rate": 1.3357141604446226e-05, "loss": 0.4684, "step": 6637 }, { "epoch": 1.23, "learning_rate": 1.3355260009707863e-05, "loss": 0.4581, "step": 6638 }, { "epoch": 1.23, "learning_rate": 1.3353378281100838e-05, "loss": 0.4562, "step": 6639 }, { "epoch": 1.23, "learning_rate": 1.3351496418700227e-05, "loss": 0.4359, "step": 6640 }, { "epoch": 1.23, "learning_rate": 1.3349614422581119e-05, "loss": 0.4485, "step": 6641 }, { "epoch": 1.23, "learning_rate": 1.3347732292818592e-05, "loss": 0.4659, "step": 6642 }, { "epoch": 1.23, "learning_rate": 1.3345850029487746e-05, "loss": 0.46, "step": 6643 }, { "epoch": 1.23, "learning_rate": 1.334396763266368e-05, "loss": 0.4296, "step": 6644 }, { "epoch": 1.23, "learning_rate": 1.3342085102421494e-05, "loss": 0.4325, "step": 6645 }, { "epoch": 1.23, "learning_rate": 1.3340202438836303e-05, "loss": 0.4348, "step": 6646 }, { "epoch": 1.23, "learning_rate": 1.3338319641983217e-05, "loss": 0.4529, "step": 6647 }, { "epoch": 1.23, "learning_rate": 1.3336436711937357e-05, "loss": 0.4365, "step": 6648 }, { "epoch": 1.23, "learning_rate": 1.3334553648773852e-05, "loss": 0.4248, "step": 6649 }, { "epoch": 1.23, "learning_rate": 1.3332670452567828e-05, "loss": 0.4614, "step": 6650 }, { "epoch": 1.23, "learning_rate": 1.3330787123394424e-05, "loss": 0.4455, "step": 6651 }, { "epoch": 1.23, "learning_rate": 1.3328903661328782e-05, "loss": 0.4334, "step": 6652 }, { "epoch": 1.23, "learning_rate": 1.3327020066446046e-05, "loss": 0.4397, "step": 6653 }, { "epoch": 1.23, "learning_rate": 1.3325136338821367e-05, "loss": 0.4489, "step": 6654 }, { "epoch": 1.23, "learning_rate": 1.3323252478529907e-05, "loss": 0.4457, "step": 6655 }, { "epoch": 1.23, "learning_rate": 1.3321368485646827e-05, "loss": 0.4474, "step": 6656 }, { "epoch": 1.23, "learning_rate": 1.3319484360247293e-05, "loss": 0.4528, "step": 6657 }, { "epoch": 1.23, "learning_rate": 1.3317600102406477e-05, "loss": 0.4163, "step": 6658 }, { "epoch": 1.23, "learning_rate": 1.3315715712199562e-05, "loss": 0.4203, "step": 6659 }, { "epoch": 1.23, "learning_rate": 1.3313831189701727e-05, "loss": 0.426, "step": 6660 }, { "epoch": 1.23, "learning_rate": 1.3311946534988162e-05, "loss": 0.4276, "step": 6661 }, { "epoch": 1.23, "learning_rate": 1.3310061748134065e-05, "loss": 0.4427, "step": 6662 }, { "epoch": 1.23, "learning_rate": 1.3308176829214632e-05, "loss": 0.4616, "step": 6663 }, { "epoch": 1.23, "learning_rate": 1.3306291778305067e-05, "loss": 0.4279, "step": 6664 }, { "epoch": 1.23, "learning_rate": 1.3304406595480581e-05, "loss": 0.4226, "step": 6665 }, { "epoch": 1.23, "learning_rate": 1.3302521280816392e-05, "loss": 0.4588, "step": 6666 }, { "epoch": 1.23, "learning_rate": 1.3300635834387716e-05, "loss": 0.4391, "step": 6667 }, { "epoch": 1.23, "learning_rate": 1.3298750256269786e-05, "loss": 0.4387, "step": 6668 }, { "epoch": 1.23, "learning_rate": 1.3296864546537824e-05, "loss": 0.4262, "step": 6669 }, { "epoch": 1.23, "learning_rate": 1.329497870526707e-05, "loss": 0.4275, "step": 6670 }, { "epoch": 1.23, "learning_rate": 1.3293092732532768e-05, "loss": 0.4348, "step": 6671 }, { "epoch": 1.23, "learning_rate": 1.3291206628410161e-05, "loss": 0.439, "step": 6672 }, { "epoch": 1.23, "learning_rate": 1.3289320392974505e-05, "loss": 0.4534, "step": 6673 }, { "epoch": 1.23, "learning_rate": 1.3287434026301053e-05, "loss": 0.4481, "step": 6674 }, { "epoch": 1.23, "learning_rate": 1.3285547528465072e-05, "loss": 0.4505, "step": 6675 }, { "epoch": 1.24, "learning_rate": 1.3283660899541828e-05, "loss": 0.4483, "step": 6676 }, { "epoch": 1.24, "learning_rate": 1.3281774139606594e-05, "loss": 0.4664, "step": 6677 }, { "epoch": 1.24, "learning_rate": 1.3279887248734644e-05, "loss": 0.4235, "step": 6678 }, { "epoch": 1.24, "learning_rate": 1.3278000227001271e-05, "loss": 0.4263, "step": 6679 }, { "epoch": 1.24, "learning_rate": 1.3276113074481756e-05, "loss": 0.4406, "step": 6680 }, { "epoch": 1.24, "learning_rate": 1.3274225791251392e-05, "loss": 0.4483, "step": 6681 }, { "epoch": 1.24, "learning_rate": 1.3272338377385483e-05, "loss": 0.4297, "step": 6682 }, { "epoch": 1.24, "learning_rate": 1.3270450832959332e-05, "loss": 0.4157, "step": 6683 }, { "epoch": 1.24, "learning_rate": 1.3268563158048246e-05, "loss": 0.4273, "step": 6684 }, { "epoch": 1.24, "learning_rate": 1.3266675352727544e-05, "loss": 0.4185, "step": 6685 }, { "epoch": 1.24, "learning_rate": 1.3264787417072542e-05, "loss": 0.431, "step": 6686 }, { "epoch": 1.24, "learning_rate": 1.3262899351158568e-05, "loss": 0.4453, "step": 6687 }, { "epoch": 1.24, "learning_rate": 1.326101115506095e-05, "loss": 0.4429, "step": 6688 }, { "epoch": 1.24, "learning_rate": 1.3259122828855022e-05, "loss": 0.4324, "step": 6689 }, { "epoch": 1.24, "learning_rate": 1.3257234372616133e-05, "loss": 0.4416, "step": 6690 }, { "epoch": 1.24, "learning_rate": 1.3255345786419618e-05, "loss": 0.4337, "step": 6691 }, { "epoch": 1.24, "learning_rate": 1.3253457070340836e-05, "loss": 0.4319, "step": 6692 }, { "epoch": 1.24, "learning_rate": 1.3251568224455138e-05, "loss": 0.4469, "step": 6693 }, { "epoch": 1.24, "learning_rate": 1.324967924883789e-05, "loss": 0.4356, "step": 6694 }, { "epoch": 1.24, "learning_rate": 1.3247790143564456e-05, "loss": 0.4465, "step": 6695 }, { "epoch": 1.24, "learning_rate": 1.324590090871021e-05, "loss": 0.4359, "step": 6696 }, { "epoch": 1.24, "learning_rate": 1.3244011544350525e-05, "loss": 0.4359, "step": 6697 }, { "epoch": 1.24, "learning_rate": 1.3242122050560786e-05, "loss": 0.4379, "step": 6698 }, { "epoch": 1.24, "learning_rate": 1.324023242741638e-05, "loss": 0.4375, "step": 6699 }, { "epoch": 1.24, "learning_rate": 1.3238342674992702e-05, "loss": 0.4377, "step": 6700 }, { "epoch": 1.24, "learning_rate": 1.3236452793365143e-05, "loss": 0.4453, "step": 6701 }, { "epoch": 1.24, "learning_rate": 1.323456278260911e-05, "loss": 0.4676, "step": 6702 }, { "epoch": 1.24, "learning_rate": 1.323267264280001e-05, "loss": 0.4415, "step": 6703 }, { "epoch": 1.24, "learning_rate": 1.323078237401326e-05, "loss": 0.4603, "step": 6704 }, { "epoch": 1.24, "learning_rate": 1.3228891976324272e-05, "loss": 0.4232, "step": 6705 }, { "epoch": 1.24, "learning_rate": 1.3227001449808475e-05, "loss": 0.4221, "step": 6706 }, { "epoch": 1.24, "learning_rate": 1.3225110794541294e-05, "loss": 0.4416, "step": 6707 }, { "epoch": 1.24, "learning_rate": 1.3223220010598161e-05, "loss": 0.4237, "step": 6708 }, { "epoch": 1.24, "learning_rate": 1.3221329098054519e-05, "loss": 0.4278, "step": 6709 }, { "epoch": 1.24, "learning_rate": 1.321943805698581e-05, "loss": 0.4533, "step": 6710 }, { "epoch": 1.24, "learning_rate": 1.3217546887467482e-05, "loss": 0.4418, "step": 6711 }, { "epoch": 1.24, "learning_rate": 1.3215655589574996e-05, "loss": 0.4536, "step": 6712 }, { "epoch": 1.24, "learning_rate": 1.32137641633838e-05, "loss": 0.432, "step": 6713 }, { "epoch": 1.24, "learning_rate": 1.3211872608969365e-05, "loss": 0.4263, "step": 6714 }, { "epoch": 1.24, "learning_rate": 1.320998092640716e-05, "loss": 0.4556, "step": 6715 }, { "epoch": 1.24, "learning_rate": 1.3208089115772658e-05, "loss": 0.4268, "step": 6716 }, { "epoch": 1.24, "learning_rate": 1.320619717714134e-05, "loss": 0.4509, "step": 6717 }, { "epoch": 1.24, "learning_rate": 1.3204305110588693e-05, "loss": 0.4331, "step": 6718 }, { "epoch": 1.24, "learning_rate": 1.3202412916190204e-05, "loss": 0.4188, "step": 6719 }, { "epoch": 1.24, "learning_rate": 1.3200520594021366e-05, "loss": 0.4219, "step": 6720 }, { "epoch": 1.24, "learning_rate": 1.3198628144157683e-05, "loss": 0.4255, "step": 6721 }, { "epoch": 1.24, "learning_rate": 1.3196735566674662e-05, "loss": 0.4182, "step": 6722 }, { "epoch": 1.24, "learning_rate": 1.3194842861647807e-05, "loss": 0.4532, "step": 6723 }, { "epoch": 1.24, "learning_rate": 1.3192950029152638e-05, "loss": 0.4438, "step": 6724 }, { "epoch": 1.24, "learning_rate": 1.3191057069264675e-05, "loss": 0.4596, "step": 6725 }, { "epoch": 1.24, "learning_rate": 1.3189163982059443e-05, "loss": 0.4685, "step": 6726 }, { "epoch": 1.24, "learning_rate": 1.3187270767612473e-05, "loss": 0.4428, "step": 6727 }, { "epoch": 1.24, "learning_rate": 1.3185377425999298e-05, "loss": 0.4388, "step": 6728 }, { "epoch": 1.24, "learning_rate": 1.3183483957295465e-05, "loss": 0.456, "step": 6729 }, { "epoch": 1.25, "learning_rate": 1.3181590361576515e-05, "loss": 0.4562, "step": 6730 }, { "epoch": 1.25, "learning_rate": 1.3179696638917998e-05, "loss": 0.4628, "step": 6731 }, { "epoch": 1.25, "learning_rate": 1.3177802789395476e-05, "loss": 0.4479, "step": 6732 }, { "epoch": 1.25, "learning_rate": 1.3175908813084501e-05, "loss": 0.4241, "step": 6733 }, { "epoch": 1.25, "learning_rate": 1.317401471006065e-05, "loss": 0.447, "step": 6734 }, { "epoch": 1.25, "learning_rate": 1.3172120480399486e-05, "loss": 0.435, "step": 6735 }, { "epoch": 1.25, "learning_rate": 1.3170226124176586e-05, "loss": 0.4391, "step": 6736 }, { "epoch": 1.25, "learning_rate": 1.3168331641467535e-05, "loss": 0.4183, "step": 6737 }, { "epoch": 1.25, "learning_rate": 1.3166437032347918e-05, "loss": 0.4361, "step": 6738 }, { "epoch": 1.25, "learning_rate": 1.3164542296893326e-05, "loss": 0.4432, "step": 6739 }, { "epoch": 1.25, "learning_rate": 1.3162647435179357e-05, "loss": 0.4221, "step": 6740 }, { "epoch": 1.25, "learning_rate": 1.3160752447281606e-05, "loss": 0.4488, "step": 6741 }, { "epoch": 1.25, "learning_rate": 1.3158857333275687e-05, "loss": 0.4559, "step": 6742 }, { "epoch": 1.25, "learning_rate": 1.3156962093237208e-05, "loss": 0.4453, "step": 6743 }, { "epoch": 1.25, "learning_rate": 1.3155066727241788e-05, "loss": 0.4098, "step": 6744 }, { "epoch": 1.25, "learning_rate": 1.3153171235365047e-05, "loss": 0.4555, "step": 6745 }, { "epoch": 1.25, "learning_rate": 1.3151275617682613e-05, "loss": 0.4302, "step": 6746 }, { "epoch": 1.25, "learning_rate": 1.3149379874270114e-05, "loss": 0.4173, "step": 6747 }, { "epoch": 1.25, "learning_rate": 1.3147484005203188e-05, "loss": 0.4521, "step": 6748 }, { "epoch": 1.25, "learning_rate": 1.3145588010557477e-05, "loss": 0.4348, "step": 6749 }, { "epoch": 1.25, "learning_rate": 1.3143691890408632e-05, "loss": 0.4414, "step": 6750 }, { "epoch": 1.25, "learning_rate": 1.3141795644832298e-05, "loss": 0.4414, "step": 6751 }, { "epoch": 1.25, "learning_rate": 1.3139899273904136e-05, "loss": 0.4252, "step": 6752 }, { "epoch": 1.25, "learning_rate": 1.3138002777699805e-05, "loss": 0.4273, "step": 6753 }, { "epoch": 1.25, "learning_rate": 1.3136106156294974e-05, "loss": 0.4373, "step": 6754 }, { "epoch": 1.25, "learning_rate": 1.3134209409765312e-05, "loss": 0.4389, "step": 6755 }, { "epoch": 1.25, "learning_rate": 1.3132312538186502e-05, "loss": 0.4312, "step": 6756 }, { "epoch": 1.25, "learning_rate": 1.3130415541634217e-05, "loss": 0.4571, "step": 6757 }, { "epoch": 1.25, "learning_rate": 1.3128518420184148e-05, "loss": 0.4206, "step": 6758 }, { "epoch": 1.25, "learning_rate": 1.3126621173911986e-05, "loss": 0.446, "step": 6759 }, { "epoch": 1.25, "learning_rate": 1.3124723802893431e-05, "loss": 0.4633, "step": 6760 }, { "epoch": 1.25, "learning_rate": 1.312282630720418e-05, "loss": 0.4375, "step": 6761 }, { "epoch": 1.25, "learning_rate": 1.3120928686919942e-05, "loss": 0.4432, "step": 6762 }, { "epoch": 1.25, "learning_rate": 1.3119030942116427e-05, "loss": 0.4329, "step": 6763 }, { "epoch": 1.25, "learning_rate": 1.311713307286935e-05, "loss": 0.4628, "step": 6764 }, { "epoch": 1.25, "learning_rate": 1.3115235079254435e-05, "loss": 0.4507, "step": 6765 }, { "epoch": 1.25, "learning_rate": 1.311333696134741e-05, "loss": 0.4429, "step": 6766 }, { "epoch": 1.25, "learning_rate": 1.3111438719224005e-05, "loss": 0.4341, "step": 6767 }, { "epoch": 1.25, "learning_rate": 1.3109540352959954e-05, "loss": 0.4286, "step": 6768 }, { "epoch": 1.25, "learning_rate": 1.3107641862631e-05, "loss": 0.4678, "step": 6769 }, { "epoch": 1.25, "learning_rate": 1.310574324831289e-05, "loss": 0.438, "step": 6770 }, { "epoch": 1.25, "learning_rate": 1.3103844510081374e-05, "loss": 0.4374, "step": 6771 }, { "epoch": 1.25, "learning_rate": 1.310194564801221e-05, "loss": 0.4335, "step": 6772 }, { "epoch": 1.25, "learning_rate": 1.3100046662181157e-05, "loss": 0.4371, "step": 6773 }, { "epoch": 1.25, "learning_rate": 1.3098147552663983e-05, "loss": 0.4594, "step": 6774 }, { "epoch": 1.25, "learning_rate": 1.3096248319536455e-05, "loss": 0.4432, "step": 6775 }, { "epoch": 1.25, "learning_rate": 1.3094348962874351e-05, "loss": 0.4332, "step": 6776 }, { "epoch": 1.25, "learning_rate": 1.3092449482753456e-05, "loss": 0.4292, "step": 6777 }, { "epoch": 1.25, "learning_rate": 1.3090549879249547e-05, "loss": 0.4409, "step": 6778 }, { "epoch": 1.25, "learning_rate": 1.3088650152438424e-05, "loss": 0.4391, "step": 6779 }, { "epoch": 1.25, "learning_rate": 1.3086750302395878e-05, "loss": 0.4344, "step": 6780 }, { "epoch": 1.25, "learning_rate": 1.3084850329197709e-05, "loss": 0.4303, "step": 6781 }, { "epoch": 1.25, "learning_rate": 1.3082950232919722e-05, "loss": 0.4406, "step": 6782 }, { "epoch": 1.25, "learning_rate": 1.3081050013637731e-05, "loss": 0.4397, "step": 6783 }, { "epoch": 1.26, "learning_rate": 1.3079149671427551e-05, "loss": 0.4369, "step": 6784 }, { "epoch": 1.26, "learning_rate": 1.3077249206364997e-05, "loss": 0.4307, "step": 6785 }, { "epoch": 1.26, "learning_rate": 1.3075348618525899e-05, "loss": 0.4315, "step": 6786 }, { "epoch": 1.26, "learning_rate": 1.3073447907986081e-05, "loss": 0.446, "step": 6787 }, { "epoch": 1.26, "learning_rate": 1.3071547074821385e-05, "loss": 0.4429, "step": 6788 }, { "epoch": 1.26, "learning_rate": 1.3069646119107645e-05, "loss": 0.4358, "step": 6789 }, { "epoch": 1.26, "learning_rate": 1.3067745040920712e-05, "loss": 0.4364, "step": 6790 }, { "epoch": 1.26, "learning_rate": 1.3065843840336429e-05, "loss": 0.4435, "step": 6791 }, { "epoch": 1.26, "learning_rate": 1.3063942517430652e-05, "loss": 0.4443, "step": 6792 }, { "epoch": 1.26, "learning_rate": 1.3062041072279244e-05, "loss": 0.4329, "step": 6793 }, { "epoch": 1.26, "learning_rate": 1.3060139504958065e-05, "loss": 0.4176, "step": 6794 }, { "epoch": 1.26, "learning_rate": 1.3058237815542987e-05, "loss": 0.4511, "step": 6795 }, { "epoch": 1.26, "learning_rate": 1.305633600410988e-05, "loss": 0.4336, "step": 6796 }, { "epoch": 1.26, "learning_rate": 1.3054434070734627e-05, "loss": 0.4401, "step": 6797 }, { "epoch": 1.26, "learning_rate": 1.3052532015493107e-05, "loss": 0.4425, "step": 6798 }, { "epoch": 1.26, "learning_rate": 1.3050629838461215e-05, "loss": 0.4215, "step": 6799 }, { "epoch": 1.26, "learning_rate": 1.3048727539714837e-05, "loss": 0.4588, "step": 6800 }, { "epoch": 1.26, "learning_rate": 1.3046825119329875e-05, "loss": 0.4348, "step": 6801 }, { "epoch": 1.26, "learning_rate": 1.3044922577382236e-05, "loss": 0.4488, "step": 6802 }, { "epoch": 1.26, "learning_rate": 1.3043019913947819e-05, "loss": 0.4508, "step": 6803 }, { "epoch": 1.26, "learning_rate": 1.3041117129102544e-05, "loss": 0.417, "step": 6804 }, { "epoch": 1.26, "learning_rate": 1.3039214222922323e-05, "loss": 0.4394, "step": 6805 }, { "epoch": 1.26, "learning_rate": 1.3037311195483086e-05, "loss": 0.4507, "step": 6806 }, { "epoch": 1.26, "learning_rate": 1.3035408046860752e-05, "loss": 0.4296, "step": 6807 }, { "epoch": 1.26, "learning_rate": 1.3033504777131258e-05, "loss": 0.4245, "step": 6808 }, { "epoch": 1.26, "learning_rate": 1.303160138637054e-05, "loss": 0.4448, "step": 6809 }, { "epoch": 1.26, "learning_rate": 1.302969787465454e-05, "loss": 0.4466, "step": 6810 }, { "epoch": 1.26, "learning_rate": 1.3027794242059203e-05, "loss": 0.4318, "step": 6811 }, { "epoch": 1.26, "learning_rate": 1.3025890488660484e-05, "loss": 0.4101, "step": 6812 }, { "epoch": 1.26, "learning_rate": 1.3023986614534334e-05, "loss": 0.4599, "step": 6813 }, { "epoch": 1.26, "learning_rate": 1.3022082619756717e-05, "loss": 0.4309, "step": 6814 }, { "epoch": 1.26, "learning_rate": 1.30201785044036e-05, "loss": 0.4027, "step": 6815 }, { "epoch": 1.26, "learning_rate": 1.3018274268550952e-05, "loss": 0.4609, "step": 6816 }, { "epoch": 1.26, "learning_rate": 1.3016369912274752e-05, "loss": 0.448, "step": 6817 }, { "epoch": 1.26, "learning_rate": 1.3014465435650974e-05, "loss": 0.4378, "step": 6818 }, { "epoch": 1.26, "learning_rate": 1.3012560838755603e-05, "loss": 0.4383, "step": 6819 }, { "epoch": 1.26, "learning_rate": 1.3010656121664638e-05, "loss": 0.4554, "step": 6820 }, { "epoch": 1.26, "learning_rate": 1.3008751284454064e-05, "loss": 0.4351, "step": 6821 }, { "epoch": 1.26, "learning_rate": 1.3006846327199888e-05, "loss": 0.4617, "step": 6822 }, { "epoch": 1.26, "learning_rate": 1.3004941249978107e-05, "loss": 0.4415, "step": 6823 }, { "epoch": 1.26, "learning_rate": 1.3003036052864735e-05, "loss": 0.4518, "step": 6824 }, { "epoch": 1.26, "learning_rate": 1.3001130735935783e-05, "loss": 0.4371, "step": 6825 }, { "epoch": 1.26, "learning_rate": 1.2999225299267273e-05, "loss": 0.4218, "step": 6826 }, { "epoch": 1.26, "learning_rate": 1.2997319742935224e-05, "loss": 0.4394, "step": 6827 }, { "epoch": 1.26, "learning_rate": 1.2995414067015669e-05, "loss": 0.4278, "step": 6828 }, { "epoch": 1.26, "learning_rate": 1.2993508271584638e-05, "loss": 0.4439, "step": 6829 }, { "epoch": 1.26, "learning_rate": 1.299160235671817e-05, "loss": 0.4534, "step": 6830 }, { "epoch": 1.26, "learning_rate": 1.2989696322492305e-05, "loss": 0.4365, "step": 6831 }, { "epoch": 1.26, "learning_rate": 1.2987790168983092e-05, "loss": 0.4353, "step": 6832 }, { "epoch": 1.26, "learning_rate": 1.2985883896266587e-05, "loss": 0.4388, "step": 6833 }, { "epoch": 1.26, "learning_rate": 1.2983977504418839e-05, "loss": 0.4308, "step": 6834 }, { "epoch": 1.26, "learning_rate": 1.2982070993515913e-05, "loss": 0.443, "step": 6835 }, { "epoch": 1.26, "learning_rate": 1.2980164363633878e-05, "loss": 0.4148, "step": 6836 }, { "epoch": 1.26, "learning_rate": 1.2978257614848799e-05, "loss": 0.4295, "step": 6837 }, { "epoch": 1.27, "learning_rate": 1.2976350747236759e-05, "loss": 0.4378, "step": 6838 }, { "epoch": 1.27, "learning_rate": 1.2974443760873833e-05, "loss": 0.4546, "step": 6839 }, { "epoch": 1.27, "learning_rate": 1.297253665583611e-05, "loss": 0.4462, "step": 6840 }, { "epoch": 1.27, "learning_rate": 1.2970629432199674e-05, "loss": 0.4361, "step": 6841 }, { "epoch": 1.27, "learning_rate": 1.2968722090040626e-05, "loss": 0.4391, "step": 6842 }, { "epoch": 1.27, "learning_rate": 1.2966814629435063e-05, "loss": 0.4299, "step": 6843 }, { "epoch": 1.27, "learning_rate": 1.296490705045909e-05, "loss": 0.4277, "step": 6844 }, { "epoch": 1.27, "learning_rate": 1.2962999353188814e-05, "loss": 0.4384, "step": 6845 }, { "epoch": 1.27, "learning_rate": 1.296109153770035e-05, "loss": 0.4323, "step": 6846 }, { "epoch": 1.27, "learning_rate": 1.2959183604069813e-05, "loss": 0.4339, "step": 6847 }, { "epoch": 1.27, "learning_rate": 1.2957275552373331e-05, "loss": 0.4657, "step": 6848 }, { "epoch": 1.27, "learning_rate": 1.2955367382687032e-05, "loss": 0.4448, "step": 6849 }, { "epoch": 1.27, "learning_rate": 1.2953459095087045e-05, "loss": 0.4506, "step": 6850 }, { "epoch": 1.27, "learning_rate": 1.2951550689649506e-05, "loss": 0.4329, "step": 6851 }, { "epoch": 1.27, "learning_rate": 1.294964216645056e-05, "loss": 0.4549, "step": 6852 }, { "epoch": 1.27, "learning_rate": 1.2947733525566353e-05, "loss": 0.429, "step": 6853 }, { "epoch": 1.27, "learning_rate": 1.2945824767073037e-05, "loss": 0.4468, "step": 6854 }, { "epoch": 1.27, "learning_rate": 1.2943915891046767e-05, "loss": 0.4612, "step": 6855 }, { "epoch": 1.27, "learning_rate": 1.2942006897563703e-05, "loss": 0.4375, "step": 6856 }, { "epoch": 1.27, "learning_rate": 1.294009778670001e-05, "loss": 0.4381, "step": 6857 }, { "epoch": 1.27, "learning_rate": 1.2938188558531862e-05, "loss": 0.4403, "step": 6858 }, { "epoch": 1.27, "learning_rate": 1.2936279213135425e-05, "loss": 0.4382, "step": 6859 }, { "epoch": 1.27, "learning_rate": 1.2934369750586885e-05, "loss": 0.4318, "step": 6860 }, { "epoch": 1.27, "learning_rate": 1.293246017096243e-05, "loss": 0.446, "step": 6861 }, { "epoch": 1.27, "learning_rate": 1.293055047433824e-05, "loss": 0.4372, "step": 6862 }, { "epoch": 1.27, "learning_rate": 1.292864066079051e-05, "loss": 0.448, "step": 6863 }, { "epoch": 1.27, "learning_rate": 1.292673073039544e-05, "loss": 0.4333, "step": 6864 }, { "epoch": 1.27, "learning_rate": 1.2924820683229235e-05, "loss": 0.4241, "step": 6865 }, { "epoch": 1.27, "learning_rate": 1.2922910519368101e-05, "loss": 0.4632, "step": 6866 }, { "epoch": 1.27, "learning_rate": 1.2921000238888247e-05, "loss": 0.4301, "step": 6867 }, { "epoch": 1.27, "learning_rate": 1.291908984186589e-05, "loss": 0.442, "step": 6868 }, { "epoch": 1.27, "learning_rate": 1.2917179328377253e-05, "loss": 0.4399, "step": 6869 }, { "epoch": 1.27, "learning_rate": 1.2915268698498565e-05, "loss": 0.4332, "step": 6870 }, { "epoch": 1.27, "learning_rate": 1.2913357952306052e-05, "loss": 0.4678, "step": 6871 }, { "epoch": 1.27, "learning_rate": 1.291144708987595e-05, "loss": 0.4511, "step": 6872 }, { "epoch": 1.27, "learning_rate": 1.2909536111284499e-05, "loss": 0.4461, "step": 6873 }, { "epoch": 1.27, "learning_rate": 1.2907625016607946e-05, "loss": 0.4362, "step": 6874 }, { "epoch": 1.27, "learning_rate": 1.2905713805922535e-05, "loss": 0.4276, "step": 6875 }, { "epoch": 1.27, "learning_rate": 1.2903802479304526e-05, "loss": 0.4194, "step": 6876 }, { "epoch": 1.27, "learning_rate": 1.2901891036830171e-05, "loss": 0.4478, "step": 6877 }, { "epoch": 1.27, "learning_rate": 1.2899979478575739e-05, "loss": 0.4428, "step": 6878 }, { "epoch": 1.27, "learning_rate": 1.2898067804617495e-05, "loss": 0.4345, "step": 6879 }, { "epoch": 1.27, "learning_rate": 1.289615601503171e-05, "loss": 0.4395, "step": 6880 }, { "epoch": 1.27, "learning_rate": 1.2894244109894662e-05, "loss": 0.4396, "step": 6881 }, { "epoch": 1.27, "learning_rate": 1.2892332089282635e-05, "loss": 0.4436, "step": 6882 }, { "epoch": 1.27, "learning_rate": 1.289041995327191e-05, "loss": 0.4373, "step": 6883 }, { "epoch": 1.27, "learning_rate": 1.2888507701938781e-05, "loss": 0.407, "step": 6884 }, { "epoch": 1.27, "learning_rate": 1.2886595335359542e-05, "loss": 0.4749, "step": 6885 }, { "epoch": 1.27, "learning_rate": 1.2884682853610495e-05, "loss": 0.44, "step": 6886 }, { "epoch": 1.27, "learning_rate": 1.2882770256767942e-05, "loss": 0.4608, "step": 6887 }, { "epoch": 1.27, "learning_rate": 1.2880857544908197e-05, "loss": 0.4416, "step": 6888 }, { "epoch": 1.27, "learning_rate": 1.2878944718107565e-05, "loss": 0.4562, "step": 6889 }, { "epoch": 1.27, "learning_rate": 1.2877031776442369e-05, "loss": 0.4405, "step": 6890 }, { "epoch": 1.27, "learning_rate": 1.2875118719988933e-05, "loss": 0.4445, "step": 6891 }, { "epoch": 1.28, "learning_rate": 1.2873205548823581e-05, "loss": 0.4351, "step": 6892 }, { "epoch": 1.28, "learning_rate": 1.2871292263022653e-05, "loss": 0.4343, "step": 6893 }, { "epoch": 1.28, "learning_rate": 1.2869378862662476e-05, "loss": 0.4487, "step": 6894 }, { "epoch": 1.28, "learning_rate": 1.2867465347819395e-05, "loss": 0.4416, "step": 6895 }, { "epoch": 1.28, "learning_rate": 1.2865551718569756e-05, "loss": 0.4331, "step": 6896 }, { "epoch": 1.28, "learning_rate": 1.2863637974989906e-05, "loss": 0.4223, "step": 6897 }, { "epoch": 1.28, "learning_rate": 1.2861724117156205e-05, "loss": 0.4251, "step": 6898 }, { "epoch": 1.28, "learning_rate": 1.2859810145145014e-05, "loss": 0.4343, "step": 6899 }, { "epoch": 1.28, "learning_rate": 1.2857896059032689e-05, "loss": 0.4543, "step": 6900 }, { "epoch": 1.28, "learning_rate": 1.2855981858895601e-05, "loss": 0.4337, "step": 6901 }, { "epoch": 1.28, "learning_rate": 1.2854067544810125e-05, "loss": 0.446, "step": 6902 }, { "epoch": 1.28, "learning_rate": 1.2852153116852639e-05, "loss": 0.4552, "step": 6903 }, { "epoch": 1.28, "learning_rate": 1.2850238575099525e-05, "loss": 0.4507, "step": 6904 }, { "epoch": 1.28, "learning_rate": 1.2848323919627167e-05, "loss": 0.4321, "step": 6905 }, { "epoch": 1.28, "learning_rate": 1.284640915051196e-05, "loss": 0.4287, "step": 6906 }, { "epoch": 1.28, "learning_rate": 1.2844494267830299e-05, "loss": 0.4234, "step": 6907 }, { "epoch": 1.28, "learning_rate": 1.2842579271658581e-05, "loss": 0.4273, "step": 6908 }, { "epoch": 1.28, "learning_rate": 1.2840664162073212e-05, "loss": 0.4266, "step": 6909 }, { "epoch": 1.28, "learning_rate": 1.2838748939150607e-05, "loss": 0.4431, "step": 6910 }, { "epoch": 1.28, "learning_rate": 1.2836833602967172e-05, "loss": 0.4649, "step": 6911 }, { "epoch": 1.28, "learning_rate": 1.2834918153599327e-05, "loss": 0.4306, "step": 6912 }, { "epoch": 1.28, "learning_rate": 1.2833002591123499e-05, "loss": 0.4767, "step": 6913 }, { "epoch": 1.28, "learning_rate": 1.283108691561611e-05, "loss": 0.4635, "step": 6914 }, { "epoch": 1.28, "learning_rate": 1.28291711271536e-05, "loss": 0.4536, "step": 6915 }, { "epoch": 1.28, "learning_rate": 1.2827255225812396e-05, "loss": 0.4429, "step": 6916 }, { "epoch": 1.28, "learning_rate": 1.2825339211668943e-05, "loss": 0.4469, "step": 6917 }, { "epoch": 1.28, "learning_rate": 1.2823423084799687e-05, "loss": 0.4166, "step": 6918 }, { "epoch": 1.28, "learning_rate": 1.2821506845281077e-05, "loss": 0.4524, "step": 6919 }, { "epoch": 1.28, "learning_rate": 1.2819590493189566e-05, "loss": 0.4314, "step": 6920 }, { "epoch": 1.28, "learning_rate": 1.281767402860162e-05, "loss": 0.4445, "step": 6921 }, { "epoch": 1.28, "learning_rate": 1.2815757451593694e-05, "loss": 0.4269, "step": 6922 }, { "epoch": 1.28, "learning_rate": 1.2813840762242258e-05, "loss": 0.447, "step": 6923 }, { "epoch": 1.28, "learning_rate": 1.2811923960623784e-05, "loss": 0.4343, "step": 6924 }, { "epoch": 1.28, "learning_rate": 1.2810007046814752e-05, "loss": 0.436, "step": 6925 }, { "epoch": 1.28, "learning_rate": 1.2808090020891642e-05, "loss": 0.4367, "step": 6926 }, { "epoch": 1.28, "learning_rate": 1.2806172882930938e-05, "loss": 0.4402, "step": 6927 }, { "epoch": 1.28, "learning_rate": 1.2804255633009133e-05, "loss": 0.4536, "step": 6928 }, { "epoch": 1.28, "learning_rate": 1.280233827120272e-05, "loss": 0.4411, "step": 6929 }, { "epoch": 1.28, "learning_rate": 1.2800420797588195e-05, "loss": 0.4547, "step": 6930 }, { "epoch": 1.28, "learning_rate": 1.2798503212242068e-05, "loss": 0.4307, "step": 6931 }, { "epoch": 1.28, "learning_rate": 1.2796585515240848e-05, "loss": 0.4583, "step": 6932 }, { "epoch": 1.28, "learning_rate": 1.2794667706661037e-05, "loss": 0.4329, "step": 6933 }, { "epoch": 1.28, "learning_rate": 1.2792749786579162e-05, "loss": 0.4506, "step": 6934 }, { "epoch": 1.28, "learning_rate": 1.279083175507174e-05, "loss": 0.4615, "step": 6935 }, { "epoch": 1.28, "learning_rate": 1.2788913612215297e-05, "loss": 0.4351, "step": 6936 }, { "epoch": 1.28, "learning_rate": 1.2786995358086368e-05, "loss": 0.447, "step": 6937 }, { "epoch": 1.28, "learning_rate": 1.2785076992761483e-05, "loss": 0.4267, "step": 6938 }, { "epoch": 1.28, "learning_rate": 1.278315851631718e-05, "loss": 0.4357, "step": 6939 }, { "epoch": 1.28, "learning_rate": 1.2781239928830006e-05, "loss": 0.4255, "step": 6940 }, { "epoch": 1.28, "learning_rate": 1.277932123037651e-05, "loss": 0.4412, "step": 6941 }, { "epoch": 1.28, "learning_rate": 1.277740242103324e-05, "loss": 0.4342, "step": 6942 }, { "epoch": 1.28, "learning_rate": 1.2775483500876757e-05, "loss": 0.4248, "step": 6943 }, { "epoch": 1.28, "learning_rate": 1.2773564469983621e-05, "loss": 0.4342, "step": 6944 }, { "epoch": 1.28, "learning_rate": 1.27716453284304e-05, "loss": 0.4469, "step": 6945 }, { "epoch": 1.29, "learning_rate": 1.2769726076293659e-05, "loss": 0.4286, "step": 6946 }, { "epoch": 1.29, "learning_rate": 1.2767806713649974e-05, "loss": 0.4528, "step": 6947 }, { "epoch": 1.29, "learning_rate": 1.2765887240575931e-05, "loss": 0.4364, "step": 6948 }, { "epoch": 1.29, "learning_rate": 1.2763967657148105e-05, "loss": 0.4463, "step": 6949 }, { "epoch": 1.29, "learning_rate": 1.2762047963443087e-05, "loss": 0.4379, "step": 6950 }, { "epoch": 1.29, "learning_rate": 1.2760128159537468e-05, "loss": 0.44, "step": 6951 }, { "epoch": 1.29, "learning_rate": 1.2758208245507846e-05, "loss": 0.4592, "step": 6952 }, { "epoch": 1.29, "learning_rate": 1.2756288221430822e-05, "loss": 0.4031, "step": 6953 }, { "epoch": 1.29, "learning_rate": 1.2754368087383e-05, "loss": 0.4493, "step": 6954 }, { "epoch": 1.29, "learning_rate": 1.2752447843440994e-05, "loss": 0.432, "step": 6955 }, { "epoch": 1.29, "learning_rate": 1.275052748968141e-05, "loss": 0.4462, "step": 6956 }, { "epoch": 1.29, "learning_rate": 1.2748607026180876e-05, "loss": 0.4366, "step": 6957 }, { "epoch": 1.29, "learning_rate": 1.2746686453016008e-05, "loss": 0.4128, "step": 6958 }, { "epoch": 1.29, "learning_rate": 1.274476577026344e-05, "loss": 0.4574, "step": 6959 }, { "epoch": 1.29, "learning_rate": 1.2742844977999797e-05, "loss": 0.4663, "step": 6960 }, { "epoch": 1.29, "learning_rate": 1.2740924076301716e-05, "loss": 0.467, "step": 6961 }, { "epoch": 1.29, "learning_rate": 1.2739003065245841e-05, "loss": 0.4303, "step": 6962 }, { "epoch": 1.29, "learning_rate": 1.2737081944908814e-05, "loss": 0.4542, "step": 6963 }, { "epoch": 1.29, "learning_rate": 1.2735160715367285e-05, "loss": 0.4228, "step": 6964 }, { "epoch": 1.29, "learning_rate": 1.273323937669791e-05, "loss": 0.4493, "step": 6965 }, { "epoch": 1.29, "learning_rate": 1.273131792897734e-05, "loss": 0.4392, "step": 6966 }, { "epoch": 1.29, "learning_rate": 1.2729396372282245e-05, "loss": 0.4378, "step": 6967 }, { "epoch": 1.29, "learning_rate": 1.2727474706689287e-05, "loss": 0.4464, "step": 6968 }, { "epoch": 1.29, "learning_rate": 1.2725552932275135e-05, "loss": 0.4428, "step": 6969 }, { "epoch": 1.29, "learning_rate": 1.2723631049116474e-05, "loss": 0.4486, "step": 6970 }, { "epoch": 1.29, "learning_rate": 1.2721709057289973e-05, "loss": 0.4453, "step": 6971 }, { "epoch": 1.29, "learning_rate": 1.2719786956872317e-05, "loss": 0.4455, "step": 6972 }, { "epoch": 1.29, "learning_rate": 1.2717864747940201e-05, "loss": 0.4434, "step": 6973 }, { "epoch": 1.29, "learning_rate": 1.271594243057031e-05, "loss": 0.4412, "step": 6974 }, { "epoch": 1.29, "learning_rate": 1.2714020004839347e-05, "loss": 0.4363, "step": 6975 }, { "epoch": 1.29, "learning_rate": 1.2712097470824009e-05, "loss": 0.42, "step": 6976 }, { "epoch": 1.29, "learning_rate": 1.2710174828601005e-05, "loss": 0.4113, "step": 6977 }, { "epoch": 1.29, "learning_rate": 1.270825207824704e-05, "loss": 0.4461, "step": 6978 }, { "epoch": 1.29, "learning_rate": 1.2706329219838836e-05, "loss": 0.4537, "step": 6979 }, { "epoch": 1.29, "learning_rate": 1.2704406253453103e-05, "loss": 0.4315, "step": 6980 }, { "epoch": 1.29, "learning_rate": 1.2702483179166572e-05, "loss": 0.4232, "step": 6981 }, { "epoch": 1.29, "learning_rate": 1.2700559997055961e-05, "loss": 0.4503, "step": 6982 }, { "epoch": 1.29, "learning_rate": 1.2698636707198008e-05, "loss": 0.4345, "step": 6983 }, { "epoch": 1.29, "learning_rate": 1.2696713309669446e-05, "loss": 0.4421, "step": 6984 }, { "epoch": 1.29, "learning_rate": 1.2694789804547017e-05, "loss": 0.4351, "step": 6985 }, { "epoch": 1.29, "learning_rate": 1.2692866191907463e-05, "loss": 0.4375, "step": 6986 }, { "epoch": 1.29, "learning_rate": 1.2690942471827537e-05, "loss": 0.4359, "step": 6987 }, { "epoch": 1.29, "learning_rate": 1.2689018644383983e-05, "loss": 0.4555, "step": 6988 }, { "epoch": 1.29, "learning_rate": 1.2687094709653567e-05, "loss": 0.4241, "step": 6989 }, { "epoch": 1.29, "learning_rate": 1.2685170667713046e-05, "loss": 0.4419, "step": 6990 }, { "epoch": 1.29, "learning_rate": 1.2683246518639187e-05, "loss": 0.434, "step": 6991 }, { "epoch": 1.29, "learning_rate": 1.2681322262508762e-05, "loss": 0.4195, "step": 6992 }, { "epoch": 1.29, "learning_rate": 1.267939789939854e-05, "loss": 0.454, "step": 6993 }, { "epoch": 1.29, "learning_rate": 1.2677473429385304e-05, "loss": 0.4276, "step": 6994 }, { "epoch": 1.29, "learning_rate": 1.2675548852545833e-05, "loss": 0.4344, "step": 6995 }, { "epoch": 1.29, "learning_rate": 1.2673624168956919e-05, "loss": 0.4229, "step": 6996 }, { "epoch": 1.29, "learning_rate": 1.267169937869535e-05, "loss": 0.4267, "step": 6997 }, { "epoch": 1.29, "learning_rate": 1.2669774481837923e-05, "loss": 0.4226, "step": 6998 }, { "epoch": 1.29, "learning_rate": 1.2667849478461437e-05, "loss": 0.4182, "step": 6999 }, { "epoch": 1.3, "learning_rate": 1.2665924368642697e-05, "loss": 0.43, "step": 7000 }, { "epoch": 1.3, "learning_rate": 1.2663999152458509e-05, "loss": 0.4327, "step": 7001 }, { "epoch": 1.3, "learning_rate": 1.2662073829985686e-05, "loss": 0.4206, "step": 7002 }, { "epoch": 1.3, "learning_rate": 1.266014840130105e-05, "loss": 0.4259, "step": 7003 }, { "epoch": 1.3, "learning_rate": 1.2658222866481414e-05, "loss": 0.4357, "step": 7004 }, { "epoch": 1.3, "learning_rate": 1.2656297225603607e-05, "loss": 0.4072, "step": 7005 }, { "epoch": 1.3, "learning_rate": 1.2654371478744461e-05, "loss": 0.4522, "step": 7006 }, { "epoch": 1.3, "learning_rate": 1.2652445625980805e-05, "loss": 0.4453, "step": 7007 }, { "epoch": 1.3, "learning_rate": 1.265051966738948e-05, "loss": 0.4403, "step": 7008 }, { "epoch": 1.3, "learning_rate": 1.2648593603047331e-05, "loss": 0.4467, "step": 7009 }, { "epoch": 1.3, "learning_rate": 1.2646667433031198e-05, "loss": 0.4364, "step": 7010 }, { "epoch": 1.3, "learning_rate": 1.2644741157417934e-05, "loss": 0.4408, "step": 7011 }, { "epoch": 1.3, "learning_rate": 1.2642814776284395e-05, "loss": 0.4448, "step": 7012 }, { "epoch": 1.3, "learning_rate": 1.264088828970744e-05, "loss": 0.424, "step": 7013 }, { "epoch": 1.3, "learning_rate": 1.2638961697763935e-05, "loss": 0.4346, "step": 7014 }, { "epoch": 1.3, "learning_rate": 1.263703500053074e-05, "loss": 0.4509, "step": 7015 }, { "epoch": 1.3, "learning_rate": 1.2635108198084732e-05, "loss": 0.4293, "step": 7016 }, { "epoch": 1.3, "learning_rate": 1.2633181290502784e-05, "loss": 0.4594, "step": 7017 }, { "epoch": 1.3, "learning_rate": 1.263125427786178e-05, "loss": 0.4443, "step": 7018 }, { "epoch": 1.3, "learning_rate": 1.26293271602386e-05, "loss": 0.4536, "step": 7019 }, { "epoch": 1.3, "learning_rate": 1.262739993771014e-05, "loss": 0.4481, "step": 7020 }, { "epoch": 1.3, "learning_rate": 1.262547261035328e-05, "loss": 0.4216, "step": 7021 }, { "epoch": 1.3, "learning_rate": 1.2623545178244924e-05, "loss": 0.4306, "step": 7022 }, { "epoch": 1.3, "learning_rate": 1.2621617641461976e-05, "loss": 0.4324, "step": 7023 }, { "epoch": 1.3, "learning_rate": 1.2619690000081337e-05, "loss": 0.4397, "step": 7024 }, { "epoch": 1.3, "learning_rate": 1.2617762254179918e-05, "loss": 0.4333, "step": 7025 }, { "epoch": 1.3, "learning_rate": 1.261583440383463e-05, "loss": 0.4248, "step": 7026 }, { "epoch": 1.3, "learning_rate": 1.2613906449122392e-05, "loss": 0.4085, "step": 7027 }, { "epoch": 1.3, "learning_rate": 1.261197839012013e-05, "loss": 0.4352, "step": 7028 }, { "epoch": 1.3, "learning_rate": 1.2610050226904763e-05, "loss": 0.429, "step": 7029 }, { "epoch": 1.3, "learning_rate": 1.2608121959553224e-05, "loss": 0.4512, "step": 7030 }, { "epoch": 1.3, "learning_rate": 1.2606193588142449e-05, "loss": 0.4443, "step": 7031 }, { "epoch": 1.3, "learning_rate": 1.2604265112749374e-05, "loss": 0.4258, "step": 7032 }, { "epoch": 1.3, "learning_rate": 1.260233653345094e-05, "loss": 0.4395, "step": 7033 }, { "epoch": 1.3, "learning_rate": 1.2600407850324102e-05, "loss": 0.4327, "step": 7034 }, { "epoch": 1.3, "learning_rate": 1.25984790634458e-05, "loss": 0.4336, "step": 7035 }, { "epoch": 1.3, "learning_rate": 1.2596550172893001e-05, "loss": 0.4295, "step": 7036 }, { "epoch": 1.3, "learning_rate": 1.2594621178742655e-05, "loss": 0.4522, "step": 7037 }, { "epoch": 1.3, "learning_rate": 1.2592692081071724e-05, "loss": 0.4405, "step": 7038 }, { "epoch": 1.3, "learning_rate": 1.2590762879957183e-05, "loss": 0.4268, "step": 7039 }, { "epoch": 1.3, "learning_rate": 1.2588833575475996e-05, "loss": 0.4357, "step": 7040 }, { "epoch": 1.3, "learning_rate": 1.2586904167705147e-05, "loss": 0.4443, "step": 7041 }, { "epoch": 1.3, "learning_rate": 1.2584974656721611e-05, "loss": 0.4309, "step": 7042 }, { "epoch": 1.3, "learning_rate": 1.2583045042602369e-05, "loss": 0.4444, "step": 7043 }, { "epoch": 1.3, "learning_rate": 1.2581115325424414e-05, "loss": 0.4443, "step": 7044 }, { "epoch": 1.3, "learning_rate": 1.2579185505264735e-05, "loss": 0.4396, "step": 7045 }, { "epoch": 1.3, "learning_rate": 1.257725558220033e-05, "loss": 0.4103, "step": 7046 }, { "epoch": 1.3, "learning_rate": 1.25753255563082e-05, "loss": 0.4474, "step": 7047 }, { "epoch": 1.3, "learning_rate": 1.257339542766535e-05, "loss": 0.4375, "step": 7048 }, { "epoch": 1.3, "learning_rate": 1.2571465196348782e-05, "loss": 0.438, "step": 7049 }, { "epoch": 1.3, "learning_rate": 1.2569534862435517e-05, "loss": 0.435, "step": 7050 }, { "epoch": 1.3, "learning_rate": 1.2567604426002567e-05, "loss": 0.4357, "step": 7051 }, { "epoch": 1.3, "learning_rate": 1.2565673887126954e-05, "loss": 0.4095, "step": 7052 }, { "epoch": 1.3, "learning_rate": 1.2563743245885705e-05, "loss": 0.4236, "step": 7053 }, { "epoch": 1.31, "learning_rate": 1.2561812502355846e-05, "loss": 0.409, "step": 7054 }, { "epoch": 1.31, "learning_rate": 1.255988165661441e-05, "loss": 0.4257, "step": 7055 }, { "epoch": 1.31, "learning_rate": 1.2557950708738436e-05, "loss": 0.4419, "step": 7056 }, { "epoch": 1.31, "learning_rate": 1.2556019658804966e-05, "loss": 0.433, "step": 7057 }, { "epoch": 1.31, "learning_rate": 1.2554088506891044e-05, "loss": 0.4203, "step": 7058 }, { "epoch": 1.31, "learning_rate": 1.2552157253073718e-05, "loss": 0.4398, "step": 7059 }, { "epoch": 1.31, "learning_rate": 1.2550225897430045e-05, "loss": 0.4107, "step": 7060 }, { "epoch": 1.31, "learning_rate": 1.2548294440037077e-05, "loss": 0.439, "step": 7061 }, { "epoch": 1.31, "learning_rate": 1.254636288097188e-05, "loss": 0.4469, "step": 7062 }, { "epoch": 1.31, "learning_rate": 1.2544431220311519e-05, "loss": 0.4293, "step": 7063 }, { "epoch": 1.31, "learning_rate": 1.2542499458133066e-05, "loss": 0.4337, "step": 7064 }, { "epoch": 1.31, "learning_rate": 1.2540567594513589e-05, "loss": 0.4386, "step": 7065 }, { "epoch": 1.31, "learning_rate": 1.253863562953017e-05, "loss": 0.4311, "step": 7066 }, { "epoch": 1.31, "learning_rate": 1.2536703563259886e-05, "loss": 0.4292, "step": 7067 }, { "epoch": 1.31, "learning_rate": 1.253477139577983e-05, "loss": 0.4535, "step": 7068 }, { "epoch": 1.31, "learning_rate": 1.2532839127167089e-05, "loss": 0.443, "step": 7069 }, { "epoch": 1.31, "learning_rate": 1.2530906757498753e-05, "loss": 0.441, "step": 7070 }, { "epoch": 1.31, "learning_rate": 1.2528974286851924e-05, "loss": 0.4432, "step": 7071 }, { "epoch": 1.31, "learning_rate": 1.2527041715303706e-05, "loss": 0.4273, "step": 7072 }, { "epoch": 1.31, "learning_rate": 1.2525109042931199e-05, "loss": 0.4355, "step": 7073 }, { "epoch": 1.31, "learning_rate": 1.2523176269811517e-05, "loss": 0.4329, "step": 7074 }, { "epoch": 1.31, "learning_rate": 1.2521243396021776e-05, "loss": 0.449, "step": 7075 }, { "epoch": 1.31, "learning_rate": 1.2519310421639087e-05, "loss": 0.4413, "step": 7076 }, { "epoch": 1.31, "learning_rate": 1.251737734674058e-05, "loss": 0.4264, "step": 7077 }, { "epoch": 1.31, "learning_rate": 1.2515444171403377e-05, "loss": 0.4434, "step": 7078 }, { "epoch": 1.31, "learning_rate": 1.2513510895704608e-05, "loss": 0.4208, "step": 7079 }, { "epoch": 1.31, "learning_rate": 1.2511577519721408e-05, "loss": 0.4325, "step": 7080 }, { "epoch": 1.31, "learning_rate": 1.2509644043530915e-05, "loss": 0.4485, "step": 7081 }, { "epoch": 1.31, "learning_rate": 1.250771046721027e-05, "loss": 0.4338, "step": 7082 }, { "epoch": 1.31, "learning_rate": 1.2505776790836622e-05, "loss": 0.4415, "step": 7083 }, { "epoch": 1.31, "learning_rate": 1.2503843014487118e-05, "loss": 0.4167, "step": 7084 }, { "epoch": 1.31, "learning_rate": 1.2501909138238915e-05, "loss": 0.438, "step": 7085 }, { "epoch": 1.31, "learning_rate": 1.2499975162169171e-05, "loss": 0.4377, "step": 7086 }, { "epoch": 1.31, "learning_rate": 1.2498041086355045e-05, "loss": 0.4287, "step": 7087 }, { "epoch": 1.31, "learning_rate": 1.2496106910873702e-05, "loss": 0.4257, "step": 7088 }, { "epoch": 1.31, "learning_rate": 1.2494172635802317e-05, "loss": 0.4245, "step": 7089 }, { "epoch": 1.31, "learning_rate": 1.2492238261218062e-05, "loss": 0.4405, "step": 7090 }, { "epoch": 1.31, "learning_rate": 1.2490303787198118e-05, "loss": 0.4302, "step": 7091 }, { "epoch": 1.31, "learning_rate": 1.2488369213819658e-05, "loss": 0.4475, "step": 7092 }, { "epoch": 1.31, "learning_rate": 1.2486434541159876e-05, "loss": 0.4472, "step": 7093 }, { "epoch": 1.31, "learning_rate": 1.2484499769295958e-05, "loss": 0.4497, "step": 7094 }, { "epoch": 1.31, "learning_rate": 1.2482564898305098e-05, "loss": 0.447, "step": 7095 }, { "epoch": 1.31, "learning_rate": 1.2480629928264496e-05, "loss": 0.4315, "step": 7096 }, { "epoch": 1.31, "learning_rate": 1.2478694859251357e-05, "loss": 0.4469, "step": 7097 }, { "epoch": 1.31, "learning_rate": 1.2476759691342877e-05, "loss": 0.4222, "step": 7098 }, { "epoch": 1.31, "learning_rate": 1.2474824424616272e-05, "loss": 0.4418, "step": 7099 }, { "epoch": 1.31, "learning_rate": 1.2472889059148757e-05, "loss": 0.4706, "step": 7100 }, { "epoch": 1.31, "learning_rate": 1.2470953595017543e-05, "loss": 0.4303, "step": 7101 }, { "epoch": 1.31, "learning_rate": 1.2469018032299858e-05, "loss": 0.4296, "step": 7102 }, { "epoch": 1.31, "learning_rate": 1.2467082371072922e-05, "loss": 0.4381, "step": 7103 }, { "epoch": 1.31, "learning_rate": 1.246514661141397e-05, "loss": 0.4527, "step": 7104 }, { "epoch": 1.31, "learning_rate": 1.2463210753400231e-05, "loss": 0.459, "step": 7105 }, { "epoch": 1.31, "learning_rate": 1.2461274797108945e-05, "loss": 0.4135, "step": 7106 }, { "epoch": 1.31, "learning_rate": 1.2459338742617348e-05, "loss": 0.4364, "step": 7107 }, { "epoch": 1.32, "learning_rate": 1.2457402590002694e-05, "loss": 0.4263, "step": 7108 }, { "epoch": 1.32, "learning_rate": 1.2455466339342224e-05, "loss": 0.4301, "step": 7109 }, { "epoch": 1.32, "learning_rate": 1.245352999071319e-05, "loss": 0.4345, "step": 7110 }, { "epoch": 1.32, "learning_rate": 1.2451593544192856e-05, "loss": 0.4338, "step": 7111 }, { "epoch": 1.32, "learning_rate": 1.2449656999858477e-05, "loss": 0.4396, "step": 7112 }, { "epoch": 1.32, "learning_rate": 1.244772035778732e-05, "loss": 0.4351, "step": 7113 }, { "epoch": 1.32, "learning_rate": 1.2445783618056652e-05, "loss": 0.4349, "step": 7114 }, { "epoch": 1.32, "learning_rate": 1.2443846780743747e-05, "loss": 0.4446, "step": 7115 }, { "epoch": 1.32, "learning_rate": 1.2441909845925877e-05, "loss": 0.4217, "step": 7116 }, { "epoch": 1.32, "learning_rate": 1.2439972813680328e-05, "loss": 0.4278, "step": 7117 }, { "epoch": 1.32, "learning_rate": 1.243803568408438e-05, "loss": 0.4265, "step": 7118 }, { "epoch": 1.32, "learning_rate": 1.2436098457215324e-05, "loss": 0.4704, "step": 7119 }, { "epoch": 1.32, "learning_rate": 1.2434161133150449e-05, "loss": 0.4433, "step": 7120 }, { "epoch": 1.32, "learning_rate": 1.243222371196705e-05, "loss": 0.4345, "step": 7121 }, { "epoch": 1.32, "learning_rate": 1.2430286193742429e-05, "loss": 0.4297, "step": 7122 }, { "epoch": 1.32, "learning_rate": 1.2428348578553887e-05, "loss": 0.4432, "step": 7123 }, { "epoch": 1.32, "learning_rate": 1.2426410866478736e-05, "loss": 0.4297, "step": 7124 }, { "epoch": 1.32, "learning_rate": 1.2424473057594282e-05, "loss": 0.4486, "step": 7125 }, { "epoch": 1.32, "learning_rate": 1.2422535151977842e-05, "loss": 0.4281, "step": 7126 }, { "epoch": 1.32, "learning_rate": 1.2420597149706732e-05, "loss": 0.4306, "step": 7127 }, { "epoch": 1.32, "learning_rate": 1.2418659050858279e-05, "loss": 0.4268, "step": 7128 }, { "epoch": 1.32, "learning_rate": 1.241672085550981e-05, "loss": 0.4297, "step": 7129 }, { "epoch": 1.32, "learning_rate": 1.241478256373865e-05, "loss": 0.4567, "step": 7130 }, { "epoch": 1.32, "learning_rate": 1.2412844175622139e-05, "loss": 0.4302, "step": 7131 }, { "epoch": 1.32, "learning_rate": 1.2410905691237612e-05, "loss": 0.4366, "step": 7132 }, { "epoch": 1.32, "learning_rate": 1.240896711066241e-05, "loss": 0.4434, "step": 7133 }, { "epoch": 1.32, "learning_rate": 1.2407028433973883e-05, "loss": 0.4284, "step": 7134 }, { "epoch": 1.32, "learning_rate": 1.2405089661249378e-05, "loss": 0.4463, "step": 7135 }, { "epoch": 1.32, "learning_rate": 1.2403150792566247e-05, "loss": 0.4406, "step": 7136 }, { "epoch": 1.32, "learning_rate": 1.240121182800185e-05, "loss": 0.4369, "step": 7137 }, { "epoch": 1.32, "learning_rate": 1.2399272767633543e-05, "loss": 0.4185, "step": 7138 }, { "epoch": 1.32, "learning_rate": 1.2397333611538698e-05, "loss": 0.4367, "step": 7139 }, { "epoch": 1.32, "learning_rate": 1.239539435979468e-05, "loss": 0.4493, "step": 7140 }, { "epoch": 1.32, "learning_rate": 1.2393455012478863e-05, "loss": 0.4478, "step": 7141 }, { "epoch": 1.32, "learning_rate": 1.2391515569668621e-05, "loss": 0.45, "step": 7142 }, { "epoch": 1.32, "learning_rate": 1.2389576031441338e-05, "loss": 0.4178, "step": 7143 }, { "epoch": 1.32, "learning_rate": 1.2387636397874393e-05, "loss": 0.4315, "step": 7144 }, { "epoch": 1.32, "learning_rate": 1.2385696669045175e-05, "loss": 0.4277, "step": 7145 }, { "epoch": 1.32, "learning_rate": 1.2383756845031081e-05, "loss": 0.4606, "step": 7146 }, { "epoch": 1.32, "learning_rate": 1.23818169259095e-05, "loss": 0.45, "step": 7147 }, { "epoch": 1.32, "learning_rate": 1.2379876911757834e-05, "loss": 0.4456, "step": 7148 }, { "epoch": 1.32, "learning_rate": 1.2377936802653483e-05, "loss": 0.4327, "step": 7149 }, { "epoch": 1.32, "learning_rate": 1.2375996598673858e-05, "loss": 0.4276, "step": 7150 }, { "epoch": 1.32, "learning_rate": 1.2374056299896366e-05, "loss": 0.4464, "step": 7151 }, { "epoch": 1.32, "learning_rate": 1.2372115906398426e-05, "loss": 0.4526, "step": 7152 }, { "epoch": 1.32, "learning_rate": 1.237017541825745e-05, "loss": 0.443, "step": 7153 }, { "epoch": 1.32, "learning_rate": 1.2368234835550866e-05, "loss": 0.4155, "step": 7154 }, { "epoch": 1.32, "learning_rate": 1.2366294158356095e-05, "loss": 0.417, "step": 7155 }, { "epoch": 1.32, "learning_rate": 1.236435338675057e-05, "loss": 0.4578, "step": 7156 }, { "epoch": 1.32, "learning_rate": 1.2362412520811721e-05, "loss": 0.4414, "step": 7157 }, { "epoch": 1.32, "learning_rate": 1.236047156061699e-05, "loss": 0.4261, "step": 7158 }, { "epoch": 1.32, "learning_rate": 1.2358530506243809e-05, "loss": 0.4384, "step": 7159 }, { "epoch": 1.32, "learning_rate": 1.2356589357769628e-05, "loss": 0.4449, "step": 7160 }, { "epoch": 1.32, "learning_rate": 1.2354648115271897e-05, "loss": 0.4418, "step": 7161 }, { "epoch": 1.33, "learning_rate": 1.2352706778828063e-05, "loss": 0.4282, "step": 7162 }, { "epoch": 1.33, "learning_rate": 1.235076534851559e-05, "loss": 0.4331, "step": 7163 }, { "epoch": 1.33, "learning_rate": 1.2348823824411927e-05, "loss": 0.4324, "step": 7164 }, { "epoch": 1.33, "learning_rate": 1.2346882206594542e-05, "loss": 0.4248, "step": 7165 }, { "epoch": 1.33, "learning_rate": 1.2344940495140902e-05, "loss": 0.422, "step": 7166 }, { "epoch": 1.33, "learning_rate": 1.2342998690128481e-05, "loss": 0.4328, "step": 7167 }, { "epoch": 1.33, "learning_rate": 1.2341056791634749e-05, "loss": 0.4326, "step": 7168 }, { "epoch": 1.33, "learning_rate": 1.2339114799737184e-05, "loss": 0.4431, "step": 7169 }, { "epoch": 1.33, "learning_rate": 1.233717271451327e-05, "loss": 0.4383, "step": 7170 }, { "epoch": 1.33, "learning_rate": 1.2335230536040491e-05, "loss": 0.4283, "step": 7171 }, { "epoch": 1.33, "learning_rate": 1.2333288264396338e-05, "loss": 0.4315, "step": 7172 }, { "epoch": 1.33, "learning_rate": 1.2331345899658303e-05, "loss": 0.4439, "step": 7173 }, { "epoch": 1.33, "learning_rate": 1.2329403441903884e-05, "loss": 0.4415, "step": 7174 }, { "epoch": 1.33, "learning_rate": 1.2327460891210582e-05, "loss": 0.4388, "step": 7175 }, { "epoch": 1.33, "learning_rate": 1.2325518247655895e-05, "loss": 0.4087, "step": 7176 }, { "epoch": 1.33, "learning_rate": 1.2323575511317339e-05, "loss": 0.4391, "step": 7177 }, { "epoch": 1.33, "learning_rate": 1.232163268227242e-05, "loss": 0.416, "step": 7178 }, { "epoch": 1.33, "learning_rate": 1.2319689760598654e-05, "loss": 0.4318, "step": 7179 }, { "epoch": 1.33, "learning_rate": 1.2317746746373564e-05, "loss": 0.4399, "step": 7180 }, { "epoch": 1.33, "learning_rate": 1.2315803639674669e-05, "loss": 0.4303, "step": 7181 }, { "epoch": 1.33, "learning_rate": 1.2313860440579496e-05, "loss": 0.4344, "step": 7182 }, { "epoch": 1.33, "learning_rate": 1.2311917149165578e-05, "loss": 0.425, "step": 7183 }, { "epoch": 1.33, "learning_rate": 1.2309973765510443e-05, "loss": 0.4265, "step": 7184 }, { "epoch": 1.33, "learning_rate": 1.2308030289691634e-05, "loss": 0.4477, "step": 7185 }, { "epoch": 1.33, "learning_rate": 1.230608672178669e-05, "loss": 0.4476, "step": 7186 }, { "epoch": 1.33, "learning_rate": 1.2304143061873152e-05, "loss": 0.4308, "step": 7187 }, { "epoch": 1.33, "learning_rate": 1.2302199310028575e-05, "loss": 0.4259, "step": 7188 }, { "epoch": 1.33, "learning_rate": 1.2300255466330506e-05, "loss": 0.442, "step": 7189 }, { "epoch": 1.33, "learning_rate": 1.2298311530856506e-05, "loss": 0.4211, "step": 7190 }, { "epoch": 1.33, "learning_rate": 1.2296367503684128e-05, "loss": 0.4249, "step": 7191 }, { "epoch": 1.33, "learning_rate": 1.229442338489094e-05, "loss": 0.4389, "step": 7192 }, { "epoch": 1.33, "learning_rate": 1.2292479174554504e-05, "loss": 0.4471, "step": 7193 }, { "epoch": 1.33, "learning_rate": 1.2290534872752393e-05, "loss": 0.4296, "step": 7194 }, { "epoch": 1.33, "learning_rate": 1.2288590479562186e-05, "loss": 0.4297, "step": 7195 }, { "epoch": 1.33, "learning_rate": 1.2286645995061455e-05, "loss": 0.4284, "step": 7196 }, { "epoch": 1.33, "learning_rate": 1.2284701419327781e-05, "loss": 0.4439, "step": 7197 }, { "epoch": 1.33, "learning_rate": 1.2282756752438749e-05, "loss": 0.4587, "step": 7198 }, { "epoch": 1.33, "learning_rate": 1.228081199447195e-05, "loss": 0.4517, "step": 7199 }, { "epoch": 1.33, "learning_rate": 1.2278867145504976e-05, "loss": 0.4202, "step": 7200 }, { "epoch": 1.33, "learning_rate": 1.2276922205615423e-05, "loss": 0.424, "step": 7201 }, { "epoch": 1.33, "learning_rate": 1.227497717488089e-05, "loss": 0.4354, "step": 7202 }, { "epoch": 1.33, "learning_rate": 1.2273032053378975e-05, "loss": 0.4412, "step": 7203 }, { "epoch": 1.33, "learning_rate": 1.2271086841187292e-05, "loss": 0.4361, "step": 7204 }, { "epoch": 1.33, "learning_rate": 1.2269141538383451e-05, "loss": 0.4284, "step": 7205 }, { "epoch": 1.33, "learning_rate": 1.2267196145045062e-05, "loss": 0.4069, "step": 7206 }, { "epoch": 1.33, "learning_rate": 1.2265250661249744e-05, "loss": 0.4323, "step": 7207 }, { "epoch": 1.33, "learning_rate": 1.226330508707512e-05, "loss": 0.4218, "step": 7208 }, { "epoch": 1.33, "learning_rate": 1.226135942259881e-05, "loss": 0.4414, "step": 7209 }, { "epoch": 1.33, "learning_rate": 1.2259413667898449e-05, "loss": 0.4448, "step": 7210 }, { "epoch": 1.33, "learning_rate": 1.2257467823051665e-05, "loss": 0.4176, "step": 7211 }, { "epoch": 1.33, "learning_rate": 1.2255521888136097e-05, "loss": 0.4396, "step": 7212 }, { "epoch": 1.33, "learning_rate": 1.2253575863229378e-05, "loss": 0.4165, "step": 7213 }, { "epoch": 1.33, "learning_rate": 1.2251629748409158e-05, "loss": 0.4267, "step": 7214 }, { "epoch": 1.33, "learning_rate": 1.2249683543753074e-05, "loss": 0.4573, "step": 7215 }, { "epoch": 1.34, "learning_rate": 1.2247737249338787e-05, "loss": 0.4296, "step": 7216 }, { "epoch": 1.34, "learning_rate": 1.2245790865243945e-05, "loss": 0.4153, "step": 7217 }, { "epoch": 1.34, "learning_rate": 1.2243844391546204e-05, "loss": 0.4438, "step": 7218 }, { "epoch": 1.34, "learning_rate": 1.2241897828323227e-05, "loss": 0.4413, "step": 7219 }, { "epoch": 1.34, "learning_rate": 1.2239951175652675e-05, "loss": 0.4361, "step": 7220 }, { "epoch": 1.34, "learning_rate": 1.223800443361222e-05, "loss": 0.4137, "step": 7221 }, { "epoch": 1.34, "learning_rate": 1.2236057602279532e-05, "loss": 0.4309, "step": 7222 }, { "epoch": 1.34, "learning_rate": 1.2234110681732287e-05, "loss": 0.4473, "step": 7223 }, { "epoch": 1.34, "learning_rate": 1.2232163672048161e-05, "loss": 0.4345, "step": 7224 }, { "epoch": 1.34, "learning_rate": 1.2230216573304835e-05, "loss": 0.4334, "step": 7225 }, { "epoch": 1.34, "learning_rate": 1.2228269385579999e-05, "loss": 0.442, "step": 7226 }, { "epoch": 1.34, "learning_rate": 1.2226322108951341e-05, "loss": 0.4359, "step": 7227 }, { "epoch": 1.34, "learning_rate": 1.2224374743496549e-05, "loss": 0.437, "step": 7228 }, { "epoch": 1.34, "learning_rate": 1.2222427289293326e-05, "loss": 0.4246, "step": 7229 }, { "epoch": 1.34, "learning_rate": 1.2220479746419369e-05, "loss": 0.4584, "step": 7230 }, { "epoch": 1.34, "learning_rate": 1.2218532114952379e-05, "loss": 0.4453, "step": 7231 }, { "epoch": 1.34, "learning_rate": 1.2216584394970066e-05, "loss": 0.4358, "step": 7232 }, { "epoch": 1.34, "learning_rate": 1.2214636586550141e-05, "loss": 0.4335, "step": 7233 }, { "epoch": 1.34, "learning_rate": 1.2212688689770318e-05, "loss": 0.441, "step": 7234 }, { "epoch": 1.34, "learning_rate": 1.2210740704708311e-05, "loss": 0.433, "step": 7235 }, { "epoch": 1.34, "learning_rate": 1.2208792631441841e-05, "loss": 0.4367, "step": 7236 }, { "epoch": 1.34, "learning_rate": 1.2206844470048635e-05, "loss": 0.4447, "step": 7237 }, { "epoch": 1.34, "learning_rate": 1.220489622060642e-05, "loss": 0.4359, "step": 7238 }, { "epoch": 1.34, "learning_rate": 1.2202947883192933e-05, "loss": 0.4352, "step": 7239 }, { "epoch": 1.34, "learning_rate": 1.22009994578859e-05, "loss": 0.4399, "step": 7240 }, { "epoch": 1.34, "learning_rate": 1.2199050944763065e-05, "loss": 0.4397, "step": 7241 }, { "epoch": 1.34, "learning_rate": 1.2197102343902167e-05, "loss": 0.4417, "step": 7242 }, { "epoch": 1.34, "learning_rate": 1.2195153655380956e-05, "loss": 0.4472, "step": 7243 }, { "epoch": 1.34, "learning_rate": 1.2193204879277175e-05, "loss": 0.4488, "step": 7244 }, { "epoch": 1.34, "learning_rate": 1.2191256015668584e-05, "loss": 0.4217, "step": 7245 }, { "epoch": 1.34, "learning_rate": 1.2189307064632933e-05, "loss": 0.4413, "step": 7246 }, { "epoch": 1.34, "learning_rate": 1.2187358026247984e-05, "loss": 0.4256, "step": 7247 }, { "epoch": 1.34, "learning_rate": 1.2185408900591498e-05, "loss": 0.4502, "step": 7248 }, { "epoch": 1.34, "learning_rate": 1.2183459687741243e-05, "loss": 0.4432, "step": 7249 }, { "epoch": 1.34, "learning_rate": 1.2181510387774991e-05, "loss": 0.4604, "step": 7250 }, { "epoch": 1.34, "learning_rate": 1.2179561000770513e-05, "loss": 0.4291, "step": 7251 }, { "epoch": 1.34, "learning_rate": 1.2177611526805586e-05, "loss": 0.4245, "step": 7252 }, { "epoch": 1.34, "learning_rate": 1.217566196595799e-05, "loss": 0.4163, "step": 7253 }, { "epoch": 1.34, "learning_rate": 1.2173712318305508e-05, "loss": 0.4282, "step": 7254 }, { "epoch": 1.34, "learning_rate": 1.2171762583925932e-05, "loss": 0.4275, "step": 7255 }, { "epoch": 1.34, "learning_rate": 1.2169812762897049e-05, "loss": 0.4397, "step": 7256 }, { "epoch": 1.34, "learning_rate": 1.2167862855296655e-05, "loss": 0.4552, "step": 7257 }, { "epoch": 1.34, "learning_rate": 1.2165912861202544e-05, "loss": 0.4388, "step": 7258 }, { "epoch": 1.34, "learning_rate": 1.2163962780692522e-05, "loss": 0.4363, "step": 7259 }, { "epoch": 1.34, "learning_rate": 1.2162012613844392e-05, "loss": 0.4482, "step": 7260 }, { "epoch": 1.34, "learning_rate": 1.2160062360735962e-05, "loss": 0.44, "step": 7261 }, { "epoch": 1.34, "learning_rate": 1.2158112021445044e-05, "loss": 0.4561, "step": 7262 }, { "epoch": 1.34, "learning_rate": 1.2156161596049447e-05, "loss": 0.4443, "step": 7263 }, { "epoch": 1.34, "learning_rate": 1.2154211084626999e-05, "loss": 0.4327, "step": 7264 }, { "epoch": 1.34, "learning_rate": 1.2152260487255514e-05, "loss": 0.4341, "step": 7265 }, { "epoch": 1.34, "learning_rate": 1.215030980401282e-05, "loss": 0.4216, "step": 7266 }, { "epoch": 1.34, "learning_rate": 1.2148359034976752e-05, "loss": 0.4272, "step": 7267 }, { "epoch": 1.34, "learning_rate": 1.2146408180225131e-05, "loss": 0.4288, "step": 7268 }, { "epoch": 1.34, "learning_rate": 1.2144457239835798e-05, "loss": 0.4584, "step": 7269 }, { "epoch": 1.35, "learning_rate": 1.2142506213886591e-05, "loss": 0.4462, "step": 7270 }, { "epoch": 1.35, "learning_rate": 1.2140555102455354e-05, "loss": 0.4398, "step": 7271 }, { "epoch": 1.35, "learning_rate": 1.2138603905619935e-05, "loss": 0.4585, "step": 7272 }, { "epoch": 1.35, "learning_rate": 1.2136652623458174e-05, "loss": 0.4433, "step": 7273 }, { "epoch": 1.35, "learning_rate": 1.2134701256047931e-05, "loss": 0.4369, "step": 7274 }, { "epoch": 1.35, "learning_rate": 1.2132749803467062e-05, "loss": 0.4512, "step": 7275 }, { "epoch": 1.35, "learning_rate": 1.2130798265793422e-05, "loss": 0.4325, "step": 7276 }, { "epoch": 1.35, "learning_rate": 1.2128846643104877e-05, "loss": 0.4501, "step": 7277 }, { "epoch": 1.35, "learning_rate": 1.2126894935479292e-05, "loss": 0.4242, "step": 7278 }, { "epoch": 1.35, "learning_rate": 1.2124943142994536e-05, "loss": 0.4446, "step": 7279 }, { "epoch": 1.35, "learning_rate": 1.2122991265728485e-05, "loss": 0.419, "step": 7280 }, { "epoch": 1.35, "learning_rate": 1.2121039303759013e-05, "loss": 0.4464, "step": 7281 }, { "epoch": 1.35, "learning_rate": 1.2119087257163997e-05, "loss": 0.4423, "step": 7282 }, { "epoch": 1.35, "learning_rate": 1.2117135126021328e-05, "loss": 0.4284, "step": 7283 }, { "epoch": 1.35, "learning_rate": 1.2115182910408885e-05, "loss": 0.438, "step": 7284 }, { "epoch": 1.35, "learning_rate": 1.2113230610404558e-05, "loss": 0.4558, "step": 7285 }, { "epoch": 1.35, "learning_rate": 1.2111278226086243e-05, "loss": 0.4269, "step": 7286 }, { "epoch": 1.35, "learning_rate": 1.2109325757531835e-05, "loss": 0.4441, "step": 7287 }, { "epoch": 1.35, "learning_rate": 1.2107373204819238e-05, "loss": 0.4509, "step": 7288 }, { "epoch": 1.35, "learning_rate": 1.210542056802635e-05, "loss": 0.4288, "step": 7289 }, { "epoch": 1.35, "learning_rate": 1.2103467847231078e-05, "loss": 0.442, "step": 7290 }, { "epoch": 1.35, "learning_rate": 1.2101515042511335e-05, "loss": 0.4385, "step": 7291 }, { "epoch": 1.35, "learning_rate": 1.2099562153945033e-05, "loss": 0.4479, "step": 7292 }, { "epoch": 1.35, "learning_rate": 1.2097609181610087e-05, "loss": 0.4301, "step": 7293 }, { "epoch": 1.35, "learning_rate": 1.2095656125584421e-05, "loss": 0.4356, "step": 7294 }, { "epoch": 1.35, "learning_rate": 1.2093702985945952e-05, "loss": 0.4474, "step": 7295 }, { "epoch": 1.35, "learning_rate": 1.209174976277261e-05, "loss": 0.4438, "step": 7296 }, { "epoch": 1.35, "learning_rate": 1.2089796456142326e-05, "loss": 0.4097, "step": 7297 }, { "epoch": 1.35, "learning_rate": 1.2087843066133033e-05, "loss": 0.4172, "step": 7298 }, { "epoch": 1.35, "learning_rate": 1.2085889592822668e-05, "loss": 0.4528, "step": 7299 }, { "epoch": 1.35, "learning_rate": 1.2083936036289171e-05, "loss": 0.4294, "step": 7300 }, { "epoch": 1.35, "learning_rate": 1.2081982396610484e-05, "loss": 0.4517, "step": 7301 }, { "epoch": 1.35, "learning_rate": 1.2080028673864552e-05, "loss": 0.4485, "step": 7302 }, { "epoch": 1.35, "learning_rate": 1.2078074868129329e-05, "loss": 0.4337, "step": 7303 }, { "epoch": 1.35, "learning_rate": 1.2076120979482763e-05, "loss": 0.4478, "step": 7304 }, { "epoch": 1.35, "learning_rate": 1.2074167008002817e-05, "loss": 0.4338, "step": 7305 }, { "epoch": 1.35, "learning_rate": 1.2072212953767448e-05, "loss": 0.4349, "step": 7306 }, { "epoch": 1.35, "learning_rate": 1.2070258816854617e-05, "loss": 0.4274, "step": 7307 }, { "epoch": 1.35, "learning_rate": 1.206830459734229e-05, "loss": 0.4517, "step": 7308 }, { "epoch": 1.35, "learning_rate": 1.2066350295308442e-05, "loss": 0.4213, "step": 7309 }, { "epoch": 1.35, "learning_rate": 1.2064395910831044e-05, "loss": 0.4472, "step": 7310 }, { "epoch": 1.35, "learning_rate": 1.2062441443988071e-05, "loss": 0.4386, "step": 7311 }, { "epoch": 1.35, "learning_rate": 1.2060486894857502e-05, "loss": 0.448, "step": 7312 }, { "epoch": 1.35, "learning_rate": 1.2058532263517319e-05, "loss": 0.4263, "step": 7313 }, { "epoch": 1.35, "learning_rate": 1.2056577550045511e-05, "loss": 0.427, "step": 7314 }, { "epoch": 1.35, "learning_rate": 1.2054622754520066e-05, "loss": 0.426, "step": 7315 }, { "epoch": 1.35, "learning_rate": 1.2052667877018981e-05, "loss": 0.4341, "step": 7316 }, { "epoch": 1.35, "learning_rate": 1.2050712917620246e-05, "loss": 0.4513, "step": 7317 }, { "epoch": 1.35, "learning_rate": 1.204875787640186e-05, "loss": 0.4457, "step": 7318 }, { "epoch": 1.35, "learning_rate": 1.2046802753441829e-05, "loss": 0.4445, "step": 7319 }, { "epoch": 1.35, "learning_rate": 1.204484754881816e-05, "loss": 0.4388, "step": 7320 }, { "epoch": 1.35, "learning_rate": 1.2042892262608856e-05, "loss": 0.4412, "step": 7321 }, { "epoch": 1.35, "learning_rate": 1.2040936894891937e-05, "loss": 0.4259, "step": 7322 }, { "epoch": 1.35, "learning_rate": 1.2038981445745412e-05, "loss": 0.4492, "step": 7323 }, { "epoch": 1.36, "learning_rate": 1.2037025915247302e-05, "loss": 0.4442, "step": 7324 }, { "epoch": 1.36, "learning_rate": 1.203507030347563e-05, "loss": 0.4289, "step": 7325 }, { "epoch": 1.36, "learning_rate": 1.203311461050842e-05, "loss": 0.4442, "step": 7326 }, { "epoch": 1.36, "learning_rate": 1.2031158836423706e-05, "loss": 0.4324, "step": 7327 }, { "epoch": 1.36, "learning_rate": 1.202920298129951e-05, "loss": 0.4211, "step": 7328 }, { "epoch": 1.36, "learning_rate": 1.2027247045213874e-05, "loss": 0.4385, "step": 7329 }, { "epoch": 1.36, "learning_rate": 1.2025291028244832e-05, "loss": 0.4259, "step": 7330 }, { "epoch": 1.36, "learning_rate": 1.202333493047043e-05, "loss": 0.4424, "step": 7331 }, { "epoch": 1.36, "learning_rate": 1.2021378751968708e-05, "loss": 0.452, "step": 7332 }, { "epoch": 1.36, "learning_rate": 1.2019422492817718e-05, "loss": 0.4272, "step": 7333 }, { "epoch": 1.36, "learning_rate": 1.201746615309551e-05, "loss": 0.4462, "step": 7334 }, { "epoch": 1.36, "learning_rate": 1.2015509732880138e-05, "loss": 0.4337, "step": 7335 }, { "epoch": 1.36, "learning_rate": 1.2013553232249657e-05, "loss": 0.4433, "step": 7336 }, { "epoch": 1.36, "learning_rate": 1.2011596651282132e-05, "loss": 0.4549, "step": 7337 }, { "epoch": 1.36, "learning_rate": 1.2009639990055625e-05, "loss": 0.4445, "step": 7338 }, { "epoch": 1.36, "learning_rate": 1.2007683248648201e-05, "loss": 0.4326, "step": 7339 }, { "epoch": 1.36, "learning_rate": 1.2005726427137936e-05, "loss": 0.4339, "step": 7340 }, { "epoch": 1.36, "learning_rate": 1.2003769525602897e-05, "loss": 0.4817, "step": 7341 }, { "epoch": 1.36, "learning_rate": 1.2001812544121164e-05, "loss": 0.4187, "step": 7342 }, { "epoch": 1.36, "learning_rate": 1.1999855482770816e-05, "loss": 0.431, "step": 7343 }, { "epoch": 1.36, "learning_rate": 1.1997898341629942e-05, "loss": 0.4326, "step": 7344 }, { "epoch": 1.36, "learning_rate": 1.1995941120776619e-05, "loss": 0.4432, "step": 7345 }, { "epoch": 1.36, "learning_rate": 1.1993983820288942e-05, "loss": 0.444, "step": 7346 }, { "epoch": 1.36, "learning_rate": 1.1992026440245e-05, "loss": 0.4523, "step": 7347 }, { "epoch": 1.36, "learning_rate": 1.1990068980722893e-05, "loss": 0.4338, "step": 7348 }, { "epoch": 1.36, "learning_rate": 1.198811144180072e-05, "loss": 0.4408, "step": 7349 }, { "epoch": 1.36, "learning_rate": 1.1986153823556579e-05, "loss": 0.4275, "step": 7350 }, { "epoch": 1.36, "learning_rate": 1.1984196126068578e-05, "loss": 0.4277, "step": 7351 }, { "epoch": 1.36, "learning_rate": 1.1982238349414825e-05, "loss": 0.4257, "step": 7352 }, { "epoch": 1.36, "learning_rate": 1.198028049367343e-05, "loss": 0.4353, "step": 7353 }, { "epoch": 1.36, "learning_rate": 1.1978322558922512e-05, "loss": 0.4541, "step": 7354 }, { "epoch": 1.36, "learning_rate": 1.1976364545240186e-05, "loss": 0.4797, "step": 7355 }, { "epoch": 1.36, "learning_rate": 1.1974406452704575e-05, "loss": 0.4521, "step": 7356 }, { "epoch": 1.36, "learning_rate": 1.1972448281393802e-05, "loss": 0.4331, "step": 7357 }, { "epoch": 1.36, "learning_rate": 1.1970490031385994e-05, "loss": 0.4241, "step": 7358 }, { "epoch": 1.36, "learning_rate": 1.1968531702759281e-05, "loss": 0.4515, "step": 7359 }, { "epoch": 1.36, "learning_rate": 1.19665732955918e-05, "loss": 0.4467, "step": 7360 }, { "epoch": 1.36, "learning_rate": 1.1964614809961684e-05, "loss": 0.4166, "step": 7361 }, { "epoch": 1.36, "learning_rate": 1.1962656245947073e-05, "loss": 0.4483, "step": 7362 }, { "epoch": 1.36, "learning_rate": 1.1960697603626113e-05, "loss": 0.4271, "step": 7363 }, { "epoch": 1.36, "learning_rate": 1.1958738883076949e-05, "loss": 0.4131, "step": 7364 }, { "epoch": 1.36, "learning_rate": 1.195678008437773e-05, "loss": 0.438, "step": 7365 }, { "epoch": 1.36, "learning_rate": 1.195482120760661e-05, "loss": 0.4445, "step": 7366 }, { "epoch": 1.36, "learning_rate": 1.1952862252841742e-05, "loss": 0.439, "step": 7367 }, { "epoch": 1.36, "learning_rate": 1.1950903220161286e-05, "loss": 0.4237, "step": 7368 }, { "epoch": 1.36, "learning_rate": 1.1948944109643401e-05, "loss": 0.4254, "step": 7369 }, { "epoch": 1.36, "learning_rate": 1.1946984921366255e-05, "loss": 0.4248, "step": 7370 }, { "epoch": 1.36, "learning_rate": 1.1945025655408018e-05, "loss": 0.4317, "step": 7371 }, { "epoch": 1.36, "learning_rate": 1.1943066311846858e-05, "loss": 0.4281, "step": 7372 }, { "epoch": 1.36, "learning_rate": 1.1941106890760947e-05, "loss": 0.4476, "step": 7373 }, { "epoch": 1.36, "learning_rate": 1.1939147392228467e-05, "loss": 0.4336, "step": 7374 }, { "epoch": 1.36, "learning_rate": 1.1937187816327596e-05, "loss": 0.4423, "step": 7375 }, { "epoch": 1.36, "learning_rate": 1.1935228163136517e-05, "loss": 0.4339, "step": 7376 }, { "epoch": 1.36, "learning_rate": 1.193326843273342e-05, "loss": 0.4554, "step": 7377 }, { "epoch": 1.37, "learning_rate": 1.193130862519649e-05, "loss": 0.4335, "step": 7378 }, { "epoch": 1.37, "learning_rate": 1.192934874060392e-05, "loss": 0.4551, "step": 7379 }, { "epoch": 1.37, "learning_rate": 1.1927388779033909e-05, "loss": 0.4524, "step": 7380 }, { "epoch": 1.37, "learning_rate": 1.1925428740564652e-05, "loss": 0.4479, "step": 7381 }, { "epoch": 1.37, "learning_rate": 1.1923468625274354e-05, "loss": 0.443, "step": 7382 }, { "epoch": 1.37, "learning_rate": 1.1921508433241223e-05, "loss": 0.4541, "step": 7383 }, { "epoch": 1.37, "learning_rate": 1.1919548164543458e-05, "loss": 0.4553, "step": 7384 }, { "epoch": 1.37, "learning_rate": 1.1917587819259278e-05, "loss": 0.4327, "step": 7385 }, { "epoch": 1.37, "learning_rate": 1.1915627397466894e-05, "loss": 0.4663, "step": 7386 }, { "epoch": 1.37, "learning_rate": 1.1913666899244522e-05, "loss": 0.4526, "step": 7387 }, { "epoch": 1.37, "learning_rate": 1.1911706324670386e-05, "loss": 0.4386, "step": 7388 }, { "epoch": 1.37, "learning_rate": 1.1909745673822706e-05, "loss": 0.414, "step": 7389 }, { "epoch": 1.37, "learning_rate": 1.190778494677971e-05, "loss": 0.4362, "step": 7390 }, { "epoch": 1.37, "learning_rate": 1.1905824143619625e-05, "loss": 0.4485, "step": 7391 }, { "epoch": 1.37, "learning_rate": 1.1903863264420686e-05, "loss": 0.429, "step": 7392 }, { "epoch": 1.37, "learning_rate": 1.190190230926113e-05, "loss": 0.4076, "step": 7393 }, { "epoch": 1.37, "learning_rate": 1.1899941278219191e-05, "loss": 0.45, "step": 7394 }, { "epoch": 1.37, "learning_rate": 1.1897980171373114e-05, "loss": 0.4351, "step": 7395 }, { "epoch": 1.37, "learning_rate": 1.189601898880114e-05, "loss": 0.4239, "step": 7396 }, { "epoch": 1.37, "learning_rate": 1.1894057730581519e-05, "loss": 0.431, "step": 7397 }, { "epoch": 1.37, "learning_rate": 1.1892096396792501e-05, "loss": 0.4356, "step": 7398 }, { "epoch": 1.37, "learning_rate": 1.1890134987512343e-05, "loss": 0.4485, "step": 7399 }, { "epoch": 1.37, "learning_rate": 1.1888173502819295e-05, "loss": 0.4378, "step": 7400 }, { "epoch": 1.37, "learning_rate": 1.1886211942791623e-05, "loss": 0.4298, "step": 7401 }, { "epoch": 1.37, "learning_rate": 1.1884250307507585e-05, "loss": 0.4289, "step": 7402 }, { "epoch": 1.37, "learning_rate": 1.1882288597045449e-05, "loss": 0.4598, "step": 7403 }, { "epoch": 1.37, "learning_rate": 1.1880326811483481e-05, "loss": 0.4384, "step": 7404 }, { "epoch": 1.37, "learning_rate": 1.1878364950899957e-05, "loss": 0.4575, "step": 7405 }, { "epoch": 1.37, "learning_rate": 1.1876403015373145e-05, "loss": 0.4367, "step": 7406 }, { "epoch": 1.37, "learning_rate": 1.1874441004981331e-05, "loss": 0.4338, "step": 7407 }, { "epoch": 1.37, "learning_rate": 1.187247891980279e-05, "loss": 0.4535, "step": 7408 }, { "epoch": 1.37, "learning_rate": 1.1870516759915807e-05, "loss": 0.4339, "step": 7409 }, { "epoch": 1.37, "learning_rate": 1.186855452539867e-05, "loss": 0.4377, "step": 7410 }, { "epoch": 1.37, "learning_rate": 1.1866592216329666e-05, "loss": 0.4318, "step": 7411 }, { "epoch": 1.37, "learning_rate": 1.1864629832787089e-05, "loss": 0.4165, "step": 7412 }, { "epoch": 1.37, "learning_rate": 1.1862667374849232e-05, "loss": 0.4548, "step": 7413 }, { "epoch": 1.37, "learning_rate": 1.1860704842594397e-05, "loss": 0.4148, "step": 7414 }, { "epoch": 1.37, "learning_rate": 1.1858742236100885e-05, "loss": 0.4383, "step": 7415 }, { "epoch": 1.37, "learning_rate": 1.1856779555446996e-05, "loss": 0.4196, "step": 7416 }, { "epoch": 1.37, "learning_rate": 1.1854816800711042e-05, "loss": 0.4277, "step": 7417 }, { "epoch": 1.37, "learning_rate": 1.185285397197133e-05, "loss": 0.4465, "step": 7418 }, { "epoch": 1.37, "learning_rate": 1.1850891069306178e-05, "loss": 0.4423, "step": 7419 }, { "epoch": 1.37, "learning_rate": 1.1848928092793897e-05, "loss": 0.4431, "step": 7420 }, { "epoch": 1.37, "learning_rate": 1.184696504251281e-05, "loss": 0.4335, "step": 7421 }, { "epoch": 1.37, "learning_rate": 1.1845001918541238e-05, "loss": 0.4477, "step": 7422 }, { "epoch": 1.37, "learning_rate": 1.1843038720957503e-05, "loss": 0.4383, "step": 7423 }, { "epoch": 1.37, "learning_rate": 1.1841075449839936e-05, "loss": 0.4439, "step": 7424 }, { "epoch": 1.37, "learning_rate": 1.1839112105266865e-05, "loss": 0.4424, "step": 7425 }, { "epoch": 1.37, "learning_rate": 1.183714868731663e-05, "loss": 0.4313, "step": 7426 }, { "epoch": 1.37, "learning_rate": 1.1835185196067562e-05, "loss": 0.443, "step": 7427 }, { "epoch": 1.37, "learning_rate": 1.1833221631598004e-05, "loss": 0.454, "step": 7428 }, { "epoch": 1.37, "learning_rate": 1.1831257993986296e-05, "loss": 0.4628, "step": 7429 }, { "epoch": 1.37, "learning_rate": 1.1829294283310783e-05, "loss": 0.4276, "step": 7430 }, { "epoch": 1.37, "learning_rate": 1.1827330499649816e-05, "loss": 0.443, "step": 7431 }, { "epoch": 1.38, "learning_rate": 1.1825366643081744e-05, "loss": 0.4307, "step": 7432 }, { "epoch": 1.38, "learning_rate": 1.1823402713684925e-05, "loss": 0.4471, "step": 7433 }, { "epoch": 1.38, "learning_rate": 1.1821438711537712e-05, "loss": 0.4251, "step": 7434 }, { "epoch": 1.38, "learning_rate": 1.1819474636718466e-05, "loss": 0.4542, "step": 7435 }, { "epoch": 1.38, "learning_rate": 1.1817510489305552e-05, "loss": 0.43, "step": 7436 }, { "epoch": 1.38, "learning_rate": 1.1815546269377336e-05, "loss": 0.4441, "step": 7437 }, { "epoch": 1.38, "learning_rate": 1.1813581977012184e-05, "loss": 0.418, "step": 7438 }, { "epoch": 1.38, "learning_rate": 1.1811617612288468e-05, "loss": 0.4466, "step": 7439 }, { "epoch": 1.38, "learning_rate": 1.1809653175284564e-05, "loss": 0.4339, "step": 7440 }, { "epoch": 1.38, "learning_rate": 1.1807688666078847e-05, "loss": 0.4445, "step": 7441 }, { "epoch": 1.38, "learning_rate": 1.18057240847497e-05, "loss": 0.4181, "step": 7442 }, { "epoch": 1.38, "learning_rate": 1.180375943137551e-05, "loss": 0.4341, "step": 7443 }, { "epoch": 1.38, "learning_rate": 1.1801794706034653e-05, "loss": 0.4399, "step": 7444 }, { "epoch": 1.38, "learning_rate": 1.1799829908805525e-05, "loss": 0.4266, "step": 7445 }, { "epoch": 1.38, "learning_rate": 1.1797865039766513e-05, "loss": 0.4365, "step": 7446 }, { "epoch": 1.38, "learning_rate": 1.1795900098996019e-05, "loss": 0.4287, "step": 7447 }, { "epoch": 1.38, "learning_rate": 1.1793935086572434e-05, "loss": 0.4435, "step": 7448 }, { "epoch": 1.38, "learning_rate": 1.179197000257416e-05, "loss": 0.4415, "step": 7449 }, { "epoch": 1.38, "learning_rate": 1.1790004847079602e-05, "loss": 0.4339, "step": 7450 }, { "epoch": 1.38, "learning_rate": 1.1788039620167163e-05, "loss": 0.438, "step": 7451 }, { "epoch": 1.38, "learning_rate": 1.1786074321915252e-05, "loss": 0.4483, "step": 7452 }, { "epoch": 1.38, "learning_rate": 1.1784108952402287e-05, "loss": 0.4417, "step": 7453 }, { "epoch": 1.38, "learning_rate": 1.1782143511706676e-05, "loss": 0.4601, "step": 7454 }, { "epoch": 1.38, "learning_rate": 1.178017799990684e-05, "loss": 0.4344, "step": 7455 }, { "epoch": 1.38, "learning_rate": 1.1778212417081195e-05, "loss": 0.4266, "step": 7456 }, { "epoch": 1.38, "learning_rate": 1.1776246763308167e-05, "loss": 0.4199, "step": 7457 }, { "epoch": 1.38, "learning_rate": 1.1774281038666181e-05, "loss": 0.4308, "step": 7458 }, { "epoch": 1.38, "learning_rate": 1.177231524323367e-05, "loss": 0.453, "step": 7459 }, { "epoch": 1.38, "learning_rate": 1.1770349377089058e-05, "loss": 0.4391, "step": 7460 }, { "epoch": 1.38, "learning_rate": 1.1768383440310786e-05, "loss": 0.4353, "step": 7461 }, { "epoch": 1.38, "learning_rate": 1.1766417432977289e-05, "loss": 0.4407, "step": 7462 }, { "epoch": 1.38, "learning_rate": 1.1764451355167007e-05, "loss": 0.4301, "step": 7463 }, { "epoch": 1.38, "learning_rate": 1.1762485206958381e-05, "loss": 0.4157, "step": 7464 }, { "epoch": 1.38, "learning_rate": 1.1760518988429861e-05, "loss": 0.4445, "step": 7465 }, { "epoch": 1.38, "learning_rate": 1.175855269965989e-05, "loss": 0.4471, "step": 7466 }, { "epoch": 1.38, "learning_rate": 1.1756586340726925e-05, "loss": 0.4195, "step": 7467 }, { "epoch": 1.38, "learning_rate": 1.1754619911709415e-05, "loss": 0.4461, "step": 7468 }, { "epoch": 1.38, "learning_rate": 1.1752653412685819e-05, "loss": 0.4314, "step": 7469 }, { "epoch": 1.38, "learning_rate": 1.17506868437346e-05, "loss": 0.4346, "step": 7470 }, { "epoch": 1.38, "learning_rate": 1.1748720204934214e-05, "loss": 0.4387, "step": 7471 }, { "epoch": 1.38, "learning_rate": 1.1746753496363132e-05, "loss": 0.4409, "step": 7472 }, { "epoch": 1.38, "learning_rate": 1.1744786718099816e-05, "loss": 0.4594, "step": 7473 }, { "epoch": 1.38, "learning_rate": 1.1742819870222743e-05, "loss": 0.4496, "step": 7474 }, { "epoch": 1.38, "learning_rate": 1.1740852952810383e-05, "loss": 0.4531, "step": 7475 }, { "epoch": 1.38, "learning_rate": 1.1738885965941216e-05, "loss": 0.4473, "step": 7476 }, { "epoch": 1.38, "learning_rate": 1.1736918909693716e-05, "loss": 0.448, "step": 7477 }, { "epoch": 1.38, "learning_rate": 1.1734951784146366e-05, "loss": 0.4497, "step": 7478 }, { "epoch": 1.38, "learning_rate": 1.1732984589377655e-05, "loss": 0.4473, "step": 7479 }, { "epoch": 1.38, "learning_rate": 1.1731017325466064e-05, "loss": 0.4295, "step": 7480 }, { "epoch": 1.38, "learning_rate": 1.1729049992490086e-05, "loss": 0.4226, "step": 7481 }, { "epoch": 1.38, "learning_rate": 1.1727082590528219e-05, "loss": 0.4401, "step": 7482 }, { "epoch": 1.38, "learning_rate": 1.1725115119658952e-05, "loss": 0.4315, "step": 7483 }, { "epoch": 1.38, "learning_rate": 1.1723147579960786e-05, "loss": 0.4339, "step": 7484 }, { "epoch": 1.38, "learning_rate": 1.172117997151222e-05, "loss": 0.4408, "step": 7485 }, { "epoch": 1.39, "learning_rate": 1.1719212294391762e-05, "loss": 0.4303, "step": 7486 }, { "epoch": 1.39, "learning_rate": 1.1717244548677918e-05, "loss": 0.4315, "step": 7487 }, { "epoch": 1.39, "learning_rate": 1.1715276734449193e-05, "loss": 0.4274, "step": 7488 }, { "epoch": 1.39, "learning_rate": 1.1713308851784103e-05, "loss": 0.4393, "step": 7489 }, { "epoch": 1.39, "learning_rate": 1.171134090076116e-05, "loss": 0.4721, "step": 7490 }, { "epoch": 1.39, "learning_rate": 1.1709372881458887e-05, "loss": 0.4264, "step": 7491 }, { "epoch": 1.39, "learning_rate": 1.1707404793955801e-05, "loss": 0.4469, "step": 7492 }, { "epoch": 1.39, "learning_rate": 1.1705436638330422e-05, "loss": 0.4255, "step": 7493 }, { "epoch": 1.39, "learning_rate": 1.170346841466128e-05, "loss": 0.4369, "step": 7494 }, { "epoch": 1.39, "learning_rate": 1.17015001230269e-05, "loss": 0.413, "step": 7495 }, { "epoch": 1.39, "learning_rate": 1.1699531763505817e-05, "loss": 0.4408, "step": 7496 }, { "epoch": 1.39, "learning_rate": 1.1697563336176565e-05, "loss": 0.4265, "step": 7497 }, { "epoch": 1.39, "learning_rate": 1.169559484111768e-05, "loss": 0.4327, "step": 7498 }, { "epoch": 1.39, "learning_rate": 1.1693626278407696e-05, "loss": 0.436, "step": 7499 }, { "epoch": 1.39, "learning_rate": 1.1691657648125162e-05, "loss": 0.4373, "step": 7500 }, { "epoch": 1.39, "learning_rate": 1.1689688950348617e-05, "loss": 0.4337, "step": 7501 }, { "epoch": 1.39, "learning_rate": 1.1687720185156613e-05, "loss": 0.4259, "step": 7502 }, { "epoch": 1.39, "learning_rate": 1.1685751352627699e-05, "loss": 0.437, "step": 7503 }, { "epoch": 1.39, "learning_rate": 1.1683782452840426e-05, "loss": 0.4204, "step": 7504 }, { "epoch": 1.39, "learning_rate": 1.168181348587335e-05, "loss": 0.4343, "step": 7505 }, { "epoch": 1.39, "learning_rate": 1.167984445180503e-05, "loss": 0.4335, "step": 7506 }, { "epoch": 1.39, "learning_rate": 1.1677875350714028e-05, "loss": 0.4451, "step": 7507 }, { "epoch": 1.39, "learning_rate": 1.1675906182678904e-05, "loss": 0.4574, "step": 7508 }, { "epoch": 1.39, "learning_rate": 1.1673936947778226e-05, "loss": 0.4374, "step": 7509 }, { "epoch": 1.39, "learning_rate": 1.1671967646090565e-05, "loss": 0.4454, "step": 7510 }, { "epoch": 1.39, "learning_rate": 1.166999827769449e-05, "loss": 0.441, "step": 7511 }, { "epoch": 1.39, "learning_rate": 1.1668028842668573e-05, "loss": 0.4444, "step": 7512 }, { "epoch": 1.39, "learning_rate": 1.1666059341091395e-05, "loss": 0.4253, "step": 7513 }, { "epoch": 1.39, "learning_rate": 1.1664089773041538e-05, "loss": 0.4571, "step": 7514 }, { "epoch": 1.39, "learning_rate": 1.1662120138597576e-05, "loss": 0.4358, "step": 7515 }, { "epoch": 1.39, "learning_rate": 1.1660150437838099e-05, "loss": 0.446, "step": 7516 }, { "epoch": 1.39, "learning_rate": 1.1658180670841692e-05, "loss": 0.4292, "step": 7517 }, { "epoch": 1.39, "learning_rate": 1.1656210837686948e-05, "loss": 0.4365, "step": 7518 }, { "epoch": 1.39, "learning_rate": 1.1654240938452456e-05, "loss": 0.4389, "step": 7519 }, { "epoch": 1.39, "learning_rate": 1.1652270973216817e-05, "loss": 0.4449, "step": 7520 }, { "epoch": 1.39, "learning_rate": 1.1650300942058622e-05, "loss": 0.4395, "step": 7521 }, { "epoch": 1.39, "learning_rate": 1.1648330845056474e-05, "loss": 0.4334, "step": 7522 }, { "epoch": 1.39, "learning_rate": 1.1646360682288979e-05, "loss": 0.4278, "step": 7523 }, { "epoch": 1.39, "learning_rate": 1.164439045383474e-05, "loss": 0.4065, "step": 7524 }, { "epoch": 1.39, "learning_rate": 1.1642420159772368e-05, "loss": 0.4306, "step": 7525 }, { "epoch": 1.39, "learning_rate": 1.164044980018047e-05, "loss": 0.4369, "step": 7526 }, { "epoch": 1.39, "learning_rate": 1.1638479375137663e-05, "loss": 0.4473, "step": 7527 }, { "epoch": 1.39, "learning_rate": 1.1636508884722564e-05, "loss": 0.4372, "step": 7528 }, { "epoch": 1.39, "learning_rate": 1.163453832901379e-05, "loss": 0.4272, "step": 7529 }, { "epoch": 1.39, "learning_rate": 1.1632567708089961e-05, "loss": 0.4289, "step": 7530 }, { "epoch": 1.39, "learning_rate": 1.1630597022029704e-05, "loss": 0.4161, "step": 7531 }, { "epoch": 1.39, "learning_rate": 1.1628626270911645e-05, "loss": 0.4356, "step": 7532 }, { "epoch": 1.39, "learning_rate": 1.1626655454814412e-05, "loss": 0.4343, "step": 7533 }, { "epoch": 1.39, "learning_rate": 1.1624684573816641e-05, "loss": 0.4339, "step": 7534 }, { "epoch": 1.39, "learning_rate": 1.1622713627996963e-05, "loss": 0.4355, "step": 7535 }, { "epoch": 1.39, "learning_rate": 1.1620742617434015e-05, "loss": 0.4536, "step": 7536 }, { "epoch": 1.39, "learning_rate": 1.1618771542206435e-05, "loss": 0.4218, "step": 7537 }, { "epoch": 1.39, "learning_rate": 1.161680040239287e-05, "loss": 0.4442, "step": 7538 }, { "epoch": 1.39, "learning_rate": 1.1614829198071962e-05, "loss": 0.4353, "step": 7539 }, { "epoch": 1.4, "learning_rate": 1.1612857929322358e-05, "loss": 0.429, "step": 7540 }, { "epoch": 1.4, "learning_rate": 1.161088659622271e-05, "loss": 0.4191, "step": 7541 }, { "epoch": 1.4, "learning_rate": 1.160891519885167e-05, "loss": 0.4276, "step": 7542 }, { "epoch": 1.4, "learning_rate": 1.160694373728789e-05, "loss": 0.4349, "step": 7543 }, { "epoch": 1.4, "learning_rate": 1.160497221161003e-05, "loss": 0.4427, "step": 7544 }, { "epoch": 1.4, "learning_rate": 1.1603000621896752e-05, "loss": 0.4379, "step": 7545 }, { "epoch": 1.4, "learning_rate": 1.1601028968226716e-05, "loss": 0.4368, "step": 7546 }, { "epoch": 1.4, "learning_rate": 1.1599057250678589e-05, "loss": 0.4456, "step": 7547 }, { "epoch": 1.4, "learning_rate": 1.1597085469331039e-05, "loss": 0.4517, "step": 7548 }, { "epoch": 1.4, "learning_rate": 1.1595113624262736e-05, "loss": 0.4409, "step": 7549 }, { "epoch": 1.4, "learning_rate": 1.159314171555235e-05, "loss": 0.4324, "step": 7550 }, { "epoch": 1.4, "learning_rate": 1.1591169743278559e-05, "loss": 0.4393, "step": 7551 }, { "epoch": 1.4, "learning_rate": 1.1589197707520045e-05, "loss": 0.4303, "step": 7552 }, { "epoch": 1.4, "learning_rate": 1.1587225608355481e-05, "loss": 0.4239, "step": 7553 }, { "epoch": 1.4, "learning_rate": 1.1585253445863556e-05, "loss": 0.4368, "step": 7554 }, { "epoch": 1.4, "learning_rate": 1.1583281220122953e-05, "loss": 0.4486, "step": 7555 }, { "epoch": 1.4, "learning_rate": 1.1581308931212361e-05, "loss": 0.423, "step": 7556 }, { "epoch": 1.4, "learning_rate": 1.157933657921047e-05, "loss": 0.4273, "step": 7557 }, { "epoch": 1.4, "learning_rate": 1.1577364164195972e-05, "loss": 0.4197, "step": 7558 }, { "epoch": 1.4, "learning_rate": 1.1575391686247566e-05, "loss": 0.4308, "step": 7559 }, { "epoch": 1.4, "learning_rate": 1.1573419145443946e-05, "loss": 0.434, "step": 7560 }, { "epoch": 1.4, "learning_rate": 1.1571446541863817e-05, "loss": 0.4402, "step": 7561 }, { "epoch": 1.4, "learning_rate": 1.1569473875585882e-05, "loss": 0.4244, "step": 7562 }, { "epoch": 1.4, "learning_rate": 1.1567501146688846e-05, "loss": 0.4303, "step": 7563 }, { "epoch": 1.4, "learning_rate": 1.1565528355251415e-05, "loss": 0.4228, "step": 7564 }, { "epoch": 1.4, "learning_rate": 1.1563555501352299e-05, "loss": 0.4235, "step": 7565 }, { "epoch": 1.4, "learning_rate": 1.1561582585070218e-05, "loss": 0.465, "step": 7566 }, { "epoch": 1.4, "learning_rate": 1.1559609606483877e-05, "loss": 0.4344, "step": 7567 }, { "epoch": 1.4, "learning_rate": 1.1557636565672003e-05, "loss": 0.4025, "step": 7568 }, { "epoch": 1.4, "learning_rate": 1.1555663462713315e-05, "loss": 0.425, "step": 7569 }, { "epoch": 1.4, "learning_rate": 1.1553690297686534e-05, "loss": 0.4381, "step": 7570 }, { "epoch": 1.4, "learning_rate": 1.1551717070670388e-05, "loss": 0.4021, "step": 7571 }, { "epoch": 1.4, "learning_rate": 1.1549743781743603e-05, "loss": 0.4144, "step": 7572 }, { "epoch": 1.4, "learning_rate": 1.1547770430984908e-05, "loss": 0.4531, "step": 7573 }, { "epoch": 1.4, "learning_rate": 1.1545797018473044e-05, "loss": 0.4269, "step": 7574 }, { "epoch": 1.4, "learning_rate": 1.1543823544286737e-05, "loss": 0.4463, "step": 7575 }, { "epoch": 1.4, "learning_rate": 1.154185000850473e-05, "loss": 0.4225, "step": 7576 }, { "epoch": 1.4, "learning_rate": 1.1539876411205762e-05, "loss": 0.4319, "step": 7577 }, { "epoch": 1.4, "learning_rate": 1.1537902752468573e-05, "loss": 0.4571, "step": 7578 }, { "epoch": 1.4, "learning_rate": 1.1535929032371915e-05, "loss": 0.4165, "step": 7579 }, { "epoch": 1.4, "learning_rate": 1.1533955250994533e-05, "loss": 0.4481, "step": 7580 }, { "epoch": 1.4, "learning_rate": 1.1531981408415176e-05, "loss": 0.4384, "step": 7581 }, { "epoch": 1.4, "learning_rate": 1.1530007504712595e-05, "loss": 0.4319, "step": 7582 }, { "epoch": 1.4, "learning_rate": 1.152803353996555e-05, "loss": 0.4409, "step": 7583 }, { "epoch": 1.4, "learning_rate": 1.1526059514252794e-05, "loss": 0.4099, "step": 7584 }, { "epoch": 1.4, "learning_rate": 1.1524085427653089e-05, "loss": 0.4278, "step": 7585 }, { "epoch": 1.4, "learning_rate": 1.1522111280245197e-05, "loss": 0.4288, "step": 7586 }, { "epoch": 1.4, "learning_rate": 1.1520137072107884e-05, "loss": 0.4393, "step": 7587 }, { "epoch": 1.4, "learning_rate": 1.1518162803319915e-05, "loss": 0.4422, "step": 7588 }, { "epoch": 1.4, "learning_rate": 1.1516188473960061e-05, "loss": 0.4227, "step": 7589 }, { "epoch": 1.4, "learning_rate": 1.1514214084107094e-05, "loss": 0.4314, "step": 7590 }, { "epoch": 1.4, "learning_rate": 1.1512239633839792e-05, "loss": 0.4271, "step": 7591 }, { "epoch": 1.4, "learning_rate": 1.1510265123236926e-05, "loss": 0.4243, "step": 7592 }, { "epoch": 1.4, "learning_rate": 1.1508290552377277e-05, "loss": 0.4207, "step": 7593 }, { "epoch": 1.4, "learning_rate": 1.1506315921339629e-05, "loss": 0.4281, "step": 7594 }, { "epoch": 1.41, "learning_rate": 1.1504341230202762e-05, "loss": 0.4233, "step": 7595 }, { "epoch": 1.41, "learning_rate": 1.150236647904547e-05, "loss": 0.4225, "step": 7596 }, { "epoch": 1.41, "learning_rate": 1.1500391667946533e-05, "loss": 0.4284, "step": 7597 }, { "epoch": 1.41, "learning_rate": 1.1498416796984746e-05, "loss": 0.4246, "step": 7598 }, { "epoch": 1.41, "learning_rate": 1.1496441866238905e-05, "loss": 0.4401, "step": 7599 }, { "epoch": 1.41, "learning_rate": 1.1494466875787803e-05, "loss": 0.4028, "step": 7600 }, { "epoch": 1.41, "learning_rate": 1.1492491825710239e-05, "loss": 0.4376, "step": 7601 }, { "epoch": 1.41, "learning_rate": 1.1490516716085018e-05, "loss": 0.4359, "step": 7602 }, { "epoch": 1.41, "learning_rate": 1.1488541546990937e-05, "loss": 0.4402, "step": 7603 }, { "epoch": 1.41, "learning_rate": 1.1486566318506804e-05, "loss": 0.4298, "step": 7604 }, { "epoch": 1.41, "learning_rate": 1.1484591030711428e-05, "loss": 0.4344, "step": 7605 }, { "epoch": 1.41, "learning_rate": 1.1482615683683616e-05, "loss": 0.4416, "step": 7606 }, { "epoch": 1.41, "learning_rate": 1.1480640277502186e-05, "loss": 0.445, "step": 7607 }, { "epoch": 1.41, "learning_rate": 1.147866481224595e-05, "loss": 0.4397, "step": 7608 }, { "epoch": 1.41, "learning_rate": 1.1476689287993722e-05, "loss": 0.4369, "step": 7609 }, { "epoch": 1.41, "learning_rate": 1.147471370482433e-05, "loss": 0.4327, "step": 7610 }, { "epoch": 1.41, "learning_rate": 1.147273806281659e-05, "loss": 0.4111, "step": 7611 }, { "epoch": 1.41, "learning_rate": 1.1470762362049329e-05, "loss": 0.4319, "step": 7612 }, { "epoch": 1.41, "learning_rate": 1.1468786602601374e-05, "loss": 0.4279, "step": 7613 }, { "epoch": 1.41, "learning_rate": 1.1466810784551549e-05, "loss": 0.4328, "step": 7614 }, { "epoch": 1.41, "learning_rate": 1.1464834907978691e-05, "loss": 0.4426, "step": 7615 }, { "epoch": 1.41, "learning_rate": 1.1462858972961632e-05, "loss": 0.4217, "step": 7616 }, { "epoch": 1.41, "learning_rate": 1.1460882979579209e-05, "loss": 0.4372, "step": 7617 }, { "epoch": 1.41, "learning_rate": 1.1458906927910263e-05, "loss": 0.4063, "step": 7618 }, { "epoch": 1.41, "learning_rate": 1.1456930818033627e-05, "loss": 0.4374, "step": 7619 }, { "epoch": 1.41, "learning_rate": 1.145495465002815e-05, "loss": 0.4347, "step": 7620 }, { "epoch": 1.41, "learning_rate": 1.1452978423972676e-05, "loss": 0.4339, "step": 7621 }, { "epoch": 1.41, "learning_rate": 1.1451002139946053e-05, "loss": 0.4377, "step": 7622 }, { "epoch": 1.41, "learning_rate": 1.1449025798027131e-05, "loss": 0.4348, "step": 7623 }, { "epoch": 1.41, "learning_rate": 1.1447049398294765e-05, "loss": 0.4278, "step": 7624 }, { "epoch": 1.41, "learning_rate": 1.1445072940827806e-05, "loss": 0.449, "step": 7625 }, { "epoch": 1.41, "learning_rate": 1.1443096425705112e-05, "loss": 0.4574, "step": 7626 }, { "epoch": 1.41, "learning_rate": 1.144111985300554e-05, "loss": 0.4599, "step": 7627 }, { "epoch": 1.41, "learning_rate": 1.1439143222807956e-05, "loss": 0.4491, "step": 7628 }, { "epoch": 1.41, "learning_rate": 1.1437166535191223e-05, "loss": 0.4151, "step": 7629 }, { "epoch": 1.41, "learning_rate": 1.1435189790234204e-05, "loss": 0.4273, "step": 7630 }, { "epoch": 1.41, "learning_rate": 1.1433212988015771e-05, "loss": 0.4385, "step": 7631 }, { "epoch": 1.41, "learning_rate": 1.143123612861479e-05, "loss": 0.4504, "step": 7632 }, { "epoch": 1.41, "learning_rate": 1.1429259212110142e-05, "loss": 0.4288, "step": 7633 }, { "epoch": 1.41, "learning_rate": 1.1427282238580694e-05, "loss": 0.4361, "step": 7634 }, { "epoch": 1.41, "learning_rate": 1.142530520810533e-05, "loss": 0.4013, "step": 7635 }, { "epoch": 1.41, "learning_rate": 1.1423328120762927e-05, "loss": 0.4096, "step": 7636 }, { "epoch": 1.41, "learning_rate": 1.1421350976632363e-05, "loss": 0.4538, "step": 7637 }, { "epoch": 1.41, "learning_rate": 1.141937377579253e-05, "loss": 0.4427, "step": 7638 }, { "epoch": 1.41, "learning_rate": 1.1417396518322313e-05, "loss": 0.4369, "step": 7639 }, { "epoch": 1.41, "learning_rate": 1.1415419204300597e-05, "loss": 0.4318, "step": 7640 }, { "epoch": 1.41, "learning_rate": 1.1413441833806276e-05, "loss": 0.4352, "step": 7641 }, { "epoch": 1.41, "learning_rate": 1.1411464406918242e-05, "loss": 0.4356, "step": 7642 }, { "epoch": 1.41, "learning_rate": 1.1409486923715392e-05, "loss": 0.4297, "step": 7643 }, { "epoch": 1.41, "learning_rate": 1.140750938427662e-05, "loss": 0.4241, "step": 7644 }, { "epoch": 1.41, "learning_rate": 1.1405531788680833e-05, "loss": 0.4295, "step": 7645 }, { "epoch": 1.41, "learning_rate": 1.1403554137006932e-05, "loss": 0.4342, "step": 7646 }, { "epoch": 1.41, "learning_rate": 1.1401576429333817e-05, "loss": 0.4425, "step": 7647 }, { "epoch": 1.41, "learning_rate": 1.1399598665740396e-05, "loss": 0.4341, "step": 7648 }, { "epoch": 1.42, "learning_rate": 1.1397620846305582e-05, "loss": 0.4454, "step": 7649 }, { "epoch": 1.42, "learning_rate": 1.1395642971108281e-05, "loss": 0.4338, "step": 7650 }, { "epoch": 1.42, "learning_rate": 1.1393665040227412e-05, "loss": 0.4188, "step": 7651 }, { "epoch": 1.42, "learning_rate": 1.1391687053741888e-05, "loss": 0.4239, "step": 7652 }, { "epoch": 1.42, "learning_rate": 1.1389709011730627e-05, "loss": 0.4396, "step": 7653 }, { "epoch": 1.42, "learning_rate": 1.1387730914272548e-05, "loss": 0.4177, "step": 7654 }, { "epoch": 1.42, "learning_rate": 1.1385752761446576e-05, "loss": 0.4608, "step": 7655 }, { "epoch": 1.42, "learning_rate": 1.1383774553331635e-05, "loss": 0.4281, "step": 7656 }, { "epoch": 1.42, "learning_rate": 1.138179629000665e-05, "loss": 0.4098, "step": 7657 }, { "epoch": 1.42, "learning_rate": 1.137981797155055e-05, "loss": 0.4351, "step": 7658 }, { "epoch": 1.42, "learning_rate": 1.137783959804227e-05, "loss": 0.4383, "step": 7659 }, { "epoch": 1.42, "learning_rate": 1.137586116956074e-05, "loss": 0.4229, "step": 7660 }, { "epoch": 1.42, "learning_rate": 1.1373882686184898e-05, "loss": 0.4536, "step": 7661 }, { "epoch": 1.42, "learning_rate": 1.137190414799368e-05, "loss": 0.442, "step": 7662 }, { "epoch": 1.42, "learning_rate": 1.1369925555066026e-05, "loss": 0.4169, "step": 7663 }, { "epoch": 1.42, "learning_rate": 1.136794690748088e-05, "loss": 0.4297, "step": 7664 }, { "epoch": 1.42, "learning_rate": 1.1365968205317183e-05, "loss": 0.4415, "step": 7665 }, { "epoch": 1.42, "learning_rate": 1.1363989448653886e-05, "loss": 0.4342, "step": 7666 }, { "epoch": 1.42, "learning_rate": 1.136201063756993e-05, "loss": 0.4324, "step": 7667 }, { "epoch": 1.42, "learning_rate": 1.136003177214428e-05, "loss": 0.4354, "step": 7668 }, { "epoch": 1.42, "learning_rate": 1.1358052852455873e-05, "loss": 0.4307, "step": 7669 }, { "epoch": 1.42, "learning_rate": 1.1356073878583675e-05, "loss": 0.4317, "step": 7670 }, { "epoch": 1.42, "learning_rate": 1.1354094850606639e-05, "loss": 0.4484, "step": 7671 }, { "epoch": 1.42, "learning_rate": 1.1352115768603726e-05, "loss": 0.4198, "step": 7672 }, { "epoch": 1.42, "learning_rate": 1.1350136632653899e-05, "loss": 0.4277, "step": 7673 }, { "epoch": 1.42, "learning_rate": 1.1348157442836116e-05, "loss": 0.4382, "step": 7674 }, { "epoch": 1.42, "learning_rate": 1.134617819922935e-05, "loss": 0.4467, "step": 7675 }, { "epoch": 1.42, "learning_rate": 1.1344198901912564e-05, "loss": 0.4222, "step": 7676 }, { "epoch": 1.42, "learning_rate": 1.1342219550964732e-05, "loss": 0.437, "step": 7677 }, { "epoch": 1.42, "learning_rate": 1.1340240146464825e-05, "loss": 0.4416, "step": 7678 }, { "epoch": 1.42, "learning_rate": 1.1338260688491817e-05, "loss": 0.4236, "step": 7679 }, { "epoch": 1.42, "learning_rate": 1.1336281177124686e-05, "loss": 0.4257, "step": 7680 }, { "epoch": 1.42, "learning_rate": 1.1334301612442409e-05, "loss": 0.4337, "step": 7681 }, { "epoch": 1.42, "learning_rate": 1.133232199452397e-05, "loss": 0.4487, "step": 7682 }, { "epoch": 1.42, "learning_rate": 1.1330342323448347e-05, "loss": 0.4301, "step": 7683 }, { "epoch": 1.42, "learning_rate": 1.132836259929453e-05, "loss": 0.441, "step": 7684 }, { "epoch": 1.42, "learning_rate": 1.1326382822141505e-05, "loss": 0.4092, "step": 7685 }, { "epoch": 1.42, "learning_rate": 1.132440299206826e-05, "loss": 0.4607, "step": 7686 }, { "epoch": 1.42, "learning_rate": 1.1322423109153788e-05, "loss": 0.4305, "step": 7687 }, { "epoch": 1.42, "learning_rate": 1.1320443173477083e-05, "loss": 0.4785, "step": 7688 }, { "epoch": 1.42, "learning_rate": 1.131846318511714e-05, "loss": 0.4272, "step": 7689 }, { "epoch": 1.42, "learning_rate": 1.1316483144152959e-05, "loss": 0.4234, "step": 7690 }, { "epoch": 1.42, "learning_rate": 1.1314503050663537e-05, "loss": 0.4417, "step": 7691 }, { "epoch": 1.42, "learning_rate": 1.1312522904727874e-05, "loss": 0.4472, "step": 7692 }, { "epoch": 1.42, "learning_rate": 1.1310542706424981e-05, "loss": 0.4267, "step": 7693 }, { "epoch": 1.42, "learning_rate": 1.1308562455833859e-05, "loss": 0.4348, "step": 7694 }, { "epoch": 1.42, "learning_rate": 1.1306582153033516e-05, "loss": 0.4073, "step": 7695 }, { "epoch": 1.42, "learning_rate": 1.1304601798102965e-05, "loss": 0.4385, "step": 7696 }, { "epoch": 1.42, "learning_rate": 1.130262139112122e-05, "loss": 0.4408, "step": 7697 }, { "epoch": 1.42, "learning_rate": 1.1300640932167291e-05, "loss": 0.4215, "step": 7698 }, { "epoch": 1.42, "learning_rate": 1.1298660421320195e-05, "loss": 0.4243, "step": 7699 }, { "epoch": 1.42, "learning_rate": 1.1296679858658956e-05, "loss": 0.4221, "step": 7700 }, { "epoch": 1.42, "learning_rate": 1.1294699244262592e-05, "loss": 0.4135, "step": 7701 }, { "epoch": 1.42, "learning_rate": 1.1292718578210122e-05, "loss": 0.4017, "step": 7702 }, { "epoch": 1.43, "learning_rate": 1.1290737860580577e-05, "loss": 0.4284, "step": 7703 }, { "epoch": 1.43, "learning_rate": 1.128875709145298e-05, "loss": 0.4197, "step": 7704 }, { "epoch": 1.43, "learning_rate": 1.128677627090636e-05, "loss": 0.4543, "step": 7705 }, { "epoch": 1.43, "learning_rate": 1.128479539901975e-05, "loss": 0.4366, "step": 7706 }, { "epoch": 1.43, "learning_rate": 1.1282814475872181e-05, "loss": 0.4208, "step": 7707 }, { "epoch": 1.43, "learning_rate": 1.1280833501542691e-05, "loss": 0.4254, "step": 7708 }, { "epoch": 1.43, "learning_rate": 1.1278852476110316e-05, "loss": 0.4301, "step": 7709 }, { "epoch": 1.43, "learning_rate": 1.1276871399654095e-05, "loss": 0.4243, "step": 7710 }, { "epoch": 1.43, "learning_rate": 1.1274890272253068e-05, "loss": 0.4413, "step": 7711 }, { "epoch": 1.43, "learning_rate": 1.1272909093986283e-05, "loss": 0.4367, "step": 7712 }, { "epoch": 1.43, "learning_rate": 1.1270927864932777e-05, "loss": 0.4357, "step": 7713 }, { "epoch": 1.43, "learning_rate": 1.1268946585171604e-05, "loss": 0.4198, "step": 7714 }, { "epoch": 1.43, "learning_rate": 1.1266965254781812e-05, "loss": 0.4504, "step": 7715 }, { "epoch": 1.43, "learning_rate": 1.1264983873842453e-05, "loss": 0.4317, "step": 7716 }, { "epoch": 1.43, "learning_rate": 1.1263002442432579e-05, "loss": 0.4679, "step": 7717 }, { "epoch": 1.43, "learning_rate": 1.1261020960631245e-05, "loss": 0.438, "step": 7718 }, { "epoch": 1.43, "learning_rate": 1.125903942851751e-05, "loss": 0.4287, "step": 7719 }, { "epoch": 1.43, "learning_rate": 1.1257057846170432e-05, "loss": 0.4091, "step": 7720 }, { "epoch": 1.43, "learning_rate": 1.1255076213669073e-05, "loss": 0.4328, "step": 7721 }, { "epoch": 1.43, "learning_rate": 1.1253094531092498e-05, "loss": 0.4241, "step": 7722 }, { "epoch": 1.43, "learning_rate": 1.1251112798519775e-05, "loss": 0.4285, "step": 7723 }, { "epoch": 1.43, "learning_rate": 1.1249131016029962e-05, "loss": 0.4275, "step": 7724 }, { "epoch": 1.43, "learning_rate": 1.1247149183702136e-05, "loss": 0.431, "step": 7725 }, { "epoch": 1.43, "learning_rate": 1.1245167301615365e-05, "loss": 0.422, "step": 7726 }, { "epoch": 1.43, "learning_rate": 1.1243185369848725e-05, "loss": 0.4319, "step": 7727 }, { "epoch": 1.43, "learning_rate": 1.1241203388481293e-05, "loss": 0.4397, "step": 7728 }, { "epoch": 1.43, "learning_rate": 1.1239221357592143e-05, "loss": 0.422, "step": 7729 }, { "epoch": 1.43, "learning_rate": 1.1237239277260355e-05, "loss": 0.4322, "step": 7730 }, { "epoch": 1.43, "learning_rate": 1.1235257147565008e-05, "loss": 0.4076, "step": 7731 }, { "epoch": 1.43, "learning_rate": 1.1233274968585187e-05, "loss": 0.4303, "step": 7732 }, { "epoch": 1.43, "learning_rate": 1.1231292740399982e-05, "loss": 0.4344, "step": 7733 }, { "epoch": 1.43, "learning_rate": 1.1229310463088474e-05, "loss": 0.4152, "step": 7734 }, { "epoch": 1.43, "learning_rate": 1.1227328136729756e-05, "loss": 0.427, "step": 7735 }, { "epoch": 1.43, "learning_rate": 1.1225345761402918e-05, "loss": 0.4498, "step": 7736 }, { "epoch": 1.43, "learning_rate": 1.122336333718705e-05, "loss": 0.4352, "step": 7737 }, { "epoch": 1.43, "learning_rate": 1.122138086416125e-05, "loss": 0.4148, "step": 7738 }, { "epoch": 1.43, "learning_rate": 1.121939834240462e-05, "loss": 0.4187, "step": 7739 }, { "epoch": 1.43, "learning_rate": 1.121741577199625e-05, "loss": 0.4189, "step": 7740 }, { "epoch": 1.43, "learning_rate": 1.1215433153015245e-05, "loss": 0.4438, "step": 7741 }, { "epoch": 1.43, "learning_rate": 1.1213450485540707e-05, "loss": 0.4613, "step": 7742 }, { "epoch": 1.43, "learning_rate": 1.121146776965174e-05, "loss": 0.4354, "step": 7743 }, { "epoch": 1.43, "learning_rate": 1.1209485005427454e-05, "loss": 0.4229, "step": 7744 }, { "epoch": 1.43, "learning_rate": 1.1207502192946958e-05, "loss": 0.4428, "step": 7745 }, { "epoch": 1.43, "learning_rate": 1.1205519332289358e-05, "loss": 0.427, "step": 7746 }, { "epoch": 1.43, "learning_rate": 1.1203536423533767e-05, "loss": 0.4373, "step": 7747 }, { "epoch": 1.43, "learning_rate": 1.1201553466759302e-05, "loss": 0.4401, "step": 7748 }, { "epoch": 1.43, "learning_rate": 1.1199570462045077e-05, "loss": 0.438, "step": 7749 }, { "epoch": 1.43, "learning_rate": 1.1197587409470216e-05, "loss": 0.4416, "step": 7750 }, { "epoch": 1.43, "learning_rate": 1.119560430911383e-05, "loss": 0.4413, "step": 7751 }, { "epoch": 1.43, "learning_rate": 1.1193621161055048e-05, "loss": 0.4226, "step": 7752 }, { "epoch": 1.43, "learning_rate": 1.119163796537299e-05, "loss": 0.4228, "step": 7753 }, { "epoch": 1.43, "learning_rate": 1.1189654722146784e-05, "loss": 0.4249, "step": 7754 }, { "epoch": 1.43, "learning_rate": 1.1187671431455558e-05, "loss": 0.4188, "step": 7755 }, { "epoch": 1.43, "learning_rate": 1.1185688093378441e-05, "loss": 0.4178, "step": 7756 }, { "epoch": 1.44, "learning_rate": 1.1183704707994564e-05, "loss": 0.4345, "step": 7757 }, { "epoch": 1.44, "learning_rate": 1.118172127538306e-05, "loss": 0.4257, "step": 7758 }, { "epoch": 1.44, "learning_rate": 1.1179737795623065e-05, "loss": 0.4368, "step": 7759 }, { "epoch": 1.44, "learning_rate": 1.1177754268793714e-05, "loss": 0.444, "step": 7760 }, { "epoch": 1.44, "learning_rate": 1.1175770694974154e-05, "loss": 0.4294, "step": 7761 }, { "epoch": 1.44, "learning_rate": 1.1173787074243514e-05, "loss": 0.4382, "step": 7762 }, { "epoch": 1.44, "learning_rate": 1.1171803406680945e-05, "loss": 0.4447, "step": 7763 }, { "epoch": 1.44, "learning_rate": 1.1169819692365591e-05, "loss": 0.4545, "step": 7764 }, { "epoch": 1.44, "learning_rate": 1.1167835931376596e-05, "loss": 0.4569, "step": 7765 }, { "epoch": 1.44, "learning_rate": 1.1165852123793111e-05, "loss": 0.4172, "step": 7766 }, { "epoch": 1.44, "learning_rate": 1.1163868269694285e-05, "loss": 0.4223, "step": 7767 }, { "epoch": 1.44, "learning_rate": 1.1161884369159268e-05, "loss": 0.4171, "step": 7768 }, { "epoch": 1.44, "learning_rate": 1.1159900422267217e-05, "loss": 0.4328, "step": 7769 }, { "epoch": 1.44, "learning_rate": 1.1157916429097285e-05, "loss": 0.4467, "step": 7770 }, { "epoch": 1.44, "learning_rate": 1.1155932389728633e-05, "loss": 0.4491, "step": 7771 }, { "epoch": 1.44, "learning_rate": 1.1153948304240421e-05, "loss": 0.4217, "step": 7772 }, { "epoch": 1.44, "learning_rate": 1.1151964172711804e-05, "loss": 0.4439, "step": 7773 }, { "epoch": 1.44, "learning_rate": 1.1149979995221952e-05, "loss": 0.4339, "step": 7774 }, { "epoch": 1.44, "learning_rate": 1.1147995771850024e-05, "loss": 0.4225, "step": 7775 }, { "epoch": 1.44, "learning_rate": 1.1146011502675192e-05, "loss": 0.4491, "step": 7776 }, { "epoch": 1.44, "learning_rate": 1.1144027187776622e-05, "loss": 0.4558, "step": 7777 }, { "epoch": 1.44, "learning_rate": 1.1142042827233489e-05, "loss": 0.4363, "step": 7778 }, { "epoch": 1.44, "learning_rate": 1.114005842112496e-05, "loss": 0.4428, "step": 7779 }, { "epoch": 1.44, "learning_rate": 1.1138073969530207e-05, "loss": 0.4482, "step": 7780 }, { "epoch": 1.44, "learning_rate": 1.1136089472528414e-05, "loss": 0.4403, "step": 7781 }, { "epoch": 1.44, "learning_rate": 1.1134104930198752e-05, "loss": 0.4401, "step": 7782 }, { "epoch": 1.44, "learning_rate": 1.1132120342620403e-05, "loss": 0.4166, "step": 7783 }, { "epoch": 1.44, "learning_rate": 1.113013570987255e-05, "loss": 0.4221, "step": 7784 }, { "epoch": 1.44, "learning_rate": 1.1128151032034373e-05, "loss": 0.4383, "step": 7785 }, { "epoch": 1.44, "learning_rate": 1.112616630918506e-05, "loss": 0.4354, "step": 7786 }, { "epoch": 1.44, "learning_rate": 1.1124181541403796e-05, "loss": 0.4545, "step": 7787 }, { "epoch": 1.44, "learning_rate": 1.1122196728769767e-05, "loss": 0.4505, "step": 7788 }, { "epoch": 1.44, "learning_rate": 1.1120211871362172e-05, "loss": 0.4347, "step": 7789 }, { "epoch": 1.44, "learning_rate": 1.1118226969260194e-05, "loss": 0.4372, "step": 7790 }, { "epoch": 1.44, "learning_rate": 1.1116242022543028e-05, "loss": 0.4163, "step": 7791 }, { "epoch": 1.44, "learning_rate": 1.1114257031289877e-05, "loss": 0.4193, "step": 7792 }, { "epoch": 1.44, "learning_rate": 1.1112271995579928e-05, "loss": 0.4143, "step": 7793 }, { "epoch": 1.44, "learning_rate": 1.1110286915492392e-05, "loss": 0.4381, "step": 7794 }, { "epoch": 1.44, "learning_rate": 1.110830179110646e-05, "loss": 0.4082, "step": 7795 }, { "epoch": 1.44, "learning_rate": 1.1106316622501338e-05, "loss": 0.426, "step": 7796 }, { "epoch": 1.44, "learning_rate": 1.1104331409756233e-05, "loss": 0.4374, "step": 7797 }, { "epoch": 1.44, "learning_rate": 1.1102346152950347e-05, "loss": 0.4235, "step": 7798 }, { "epoch": 1.44, "learning_rate": 1.110036085216289e-05, "loss": 0.4477, "step": 7799 }, { "epoch": 1.44, "learning_rate": 1.1098375507473075e-05, "loss": 0.4195, "step": 7800 }, { "epoch": 1.44, "learning_rate": 1.1096390118960113e-05, "loss": 0.4375, "step": 7801 }, { "epoch": 1.44, "learning_rate": 1.1094404686703211e-05, "loss": 0.4223, "step": 7802 }, { "epoch": 1.44, "learning_rate": 1.1092419210781589e-05, "loss": 0.4273, "step": 7803 }, { "epoch": 1.44, "learning_rate": 1.1090433691274462e-05, "loss": 0.4253, "step": 7804 }, { "epoch": 1.44, "learning_rate": 1.1088448128261051e-05, "loss": 0.446, "step": 7805 }, { "epoch": 1.44, "learning_rate": 1.1086462521820575e-05, "loss": 0.4327, "step": 7806 }, { "epoch": 1.44, "learning_rate": 1.1084476872032255e-05, "loss": 0.4308, "step": 7807 }, { "epoch": 1.44, "learning_rate": 1.1082491178975317e-05, "loss": 0.4171, "step": 7808 }, { "epoch": 1.44, "learning_rate": 1.1080505442728984e-05, "loss": 0.424, "step": 7809 }, { "epoch": 1.44, "learning_rate": 1.1078519663372485e-05, "loss": 0.4396, "step": 7810 }, { "epoch": 1.45, "learning_rate": 1.1076533840985046e-05, "loss": 0.4412, "step": 7811 }, { "epoch": 1.45, "learning_rate": 1.1074547975645902e-05, "loss": 0.4436, "step": 7812 }, { "epoch": 1.45, "learning_rate": 1.1072562067434282e-05, "loss": 0.4348, "step": 7813 }, { "epoch": 1.45, "learning_rate": 1.1070576116429423e-05, "loss": 0.4305, "step": 7814 }, { "epoch": 1.45, "learning_rate": 1.1068590122710558e-05, "loss": 0.4418, "step": 7815 }, { "epoch": 1.45, "learning_rate": 1.106660408635693e-05, "loss": 0.4082, "step": 7816 }, { "epoch": 1.45, "learning_rate": 1.1064618007447768e-05, "loss": 0.4349, "step": 7817 }, { "epoch": 1.45, "learning_rate": 1.1062631886062321e-05, "loss": 0.4097, "step": 7818 }, { "epoch": 1.45, "learning_rate": 1.1060645722279828e-05, "loss": 0.4422, "step": 7819 }, { "epoch": 1.45, "learning_rate": 1.1058659516179534e-05, "loss": 0.4309, "step": 7820 }, { "epoch": 1.45, "learning_rate": 1.1056673267840685e-05, "loss": 0.4576, "step": 7821 }, { "epoch": 1.45, "learning_rate": 1.1054686977342533e-05, "loss": 0.4187, "step": 7822 }, { "epoch": 1.45, "learning_rate": 1.105270064476432e-05, "loss": 0.4115, "step": 7823 }, { "epoch": 1.45, "learning_rate": 1.1050714270185301e-05, "loss": 0.4462, "step": 7824 }, { "epoch": 1.45, "learning_rate": 1.104872785368473e-05, "loss": 0.4464, "step": 7825 }, { "epoch": 1.45, "learning_rate": 1.1046741395341853e-05, "loss": 0.4347, "step": 7826 }, { "epoch": 1.45, "learning_rate": 1.1044754895235941e-05, "loss": 0.4461, "step": 7827 }, { "epoch": 1.45, "learning_rate": 1.1042768353446237e-05, "loss": 0.4193, "step": 7828 }, { "epoch": 1.45, "learning_rate": 1.1040781770052007e-05, "loss": 0.4225, "step": 7829 }, { "epoch": 1.45, "learning_rate": 1.1038795145132512e-05, "loss": 0.4143, "step": 7830 }, { "epoch": 1.45, "learning_rate": 1.1036808478767014e-05, "loss": 0.4397, "step": 7831 }, { "epoch": 1.45, "learning_rate": 1.1034821771034778e-05, "loss": 0.4473, "step": 7832 }, { "epoch": 1.45, "learning_rate": 1.1032835022015067e-05, "loss": 0.4137, "step": 7833 }, { "epoch": 1.45, "learning_rate": 1.1030848231787152e-05, "loss": 0.438, "step": 7834 }, { "epoch": 1.45, "learning_rate": 1.1028861400430301e-05, "loss": 0.4472, "step": 7835 }, { "epoch": 1.45, "learning_rate": 1.1026874528023785e-05, "loss": 0.4227, "step": 7836 }, { "epoch": 1.45, "learning_rate": 1.1024887614646878e-05, "loss": 0.4227, "step": 7837 }, { "epoch": 1.45, "learning_rate": 1.1022900660378855e-05, "loss": 0.4162, "step": 7838 }, { "epoch": 1.45, "learning_rate": 1.1020913665298985e-05, "loss": 0.4353, "step": 7839 }, { "epoch": 1.45, "learning_rate": 1.101892662948655e-05, "loss": 0.4322, "step": 7840 }, { "epoch": 1.45, "learning_rate": 1.1016939553020831e-05, "loss": 0.4398, "step": 7841 }, { "epoch": 1.45, "learning_rate": 1.1014952435981106e-05, "loss": 0.4363, "step": 7842 }, { "epoch": 1.45, "learning_rate": 1.1012965278446657e-05, "loss": 0.4529, "step": 7843 }, { "epoch": 1.45, "learning_rate": 1.1010978080496773e-05, "loss": 0.4446, "step": 7844 }, { "epoch": 1.45, "learning_rate": 1.1008990842210731e-05, "loss": 0.4276, "step": 7845 }, { "epoch": 1.45, "learning_rate": 1.1007003563667824e-05, "loss": 0.4341, "step": 7846 }, { "epoch": 1.45, "learning_rate": 1.1005016244947337e-05, "loss": 0.4462, "step": 7847 }, { "epoch": 1.45, "learning_rate": 1.1003028886128564e-05, "loss": 0.4304, "step": 7848 }, { "epoch": 1.45, "learning_rate": 1.1001041487290798e-05, "loss": 0.4488, "step": 7849 }, { "epoch": 1.45, "learning_rate": 1.099905404851333e-05, "loss": 0.4404, "step": 7850 }, { "epoch": 1.45, "learning_rate": 1.0997066569875451e-05, "loss": 0.4429, "step": 7851 }, { "epoch": 1.45, "learning_rate": 1.0995079051456464e-05, "loss": 0.4284, "step": 7852 }, { "epoch": 1.45, "learning_rate": 1.0993091493335663e-05, "loss": 0.4341, "step": 7853 }, { "epoch": 1.45, "learning_rate": 1.0991103895592352e-05, "loss": 0.4168, "step": 7854 }, { "epoch": 1.45, "learning_rate": 1.0989116258305835e-05, "loss": 0.4335, "step": 7855 }, { "epoch": 1.45, "learning_rate": 1.0987128581555403e-05, "loss": 0.4355, "step": 7856 }, { "epoch": 1.45, "learning_rate": 1.0985140865420374e-05, "loss": 0.4206, "step": 7857 }, { "epoch": 1.45, "learning_rate": 1.0983153109980045e-05, "loss": 0.4298, "step": 7858 }, { "epoch": 1.45, "learning_rate": 1.0981165315313729e-05, "loss": 0.4368, "step": 7859 }, { "epoch": 1.45, "learning_rate": 1.0979177481500731e-05, "loss": 0.4523, "step": 7860 }, { "epoch": 1.45, "learning_rate": 1.0977189608620366e-05, "loss": 0.4193, "step": 7861 }, { "epoch": 1.45, "learning_rate": 1.0975201696751946e-05, "loss": 0.435, "step": 7862 }, { "epoch": 1.45, "learning_rate": 1.097321374597478e-05, "loss": 0.4265, "step": 7863 }, { "epoch": 1.45, "learning_rate": 1.0971225756368192e-05, "loss": 0.4309, "step": 7864 }, { "epoch": 1.46, "learning_rate": 1.0969237728011492e-05, "loss": 0.4099, "step": 7865 }, { "epoch": 1.46, "learning_rate": 1.0967249660984003e-05, "loss": 0.4334, "step": 7866 }, { "epoch": 1.46, "learning_rate": 1.0965261555365041e-05, "loss": 0.4311, "step": 7867 }, { "epoch": 1.46, "learning_rate": 1.0963273411233932e-05, "loss": 0.4466, "step": 7868 }, { "epoch": 1.46, "learning_rate": 1.0961285228669995e-05, "loss": 0.4363, "step": 7869 }, { "epoch": 1.46, "learning_rate": 1.095929700775256e-05, "loss": 0.4412, "step": 7870 }, { "epoch": 1.46, "learning_rate": 1.095730874856095e-05, "loss": 0.4338, "step": 7871 }, { "epoch": 1.46, "learning_rate": 1.0955320451174491e-05, "loss": 0.4316, "step": 7872 }, { "epoch": 1.46, "learning_rate": 1.0953332115672517e-05, "loss": 0.4423, "step": 7873 }, { "epoch": 1.46, "learning_rate": 1.0951343742134355e-05, "loss": 0.4288, "step": 7874 }, { "epoch": 1.46, "learning_rate": 1.0949355330639339e-05, "loss": 0.4309, "step": 7875 }, { "epoch": 1.46, "learning_rate": 1.0947366881266807e-05, "loss": 0.4299, "step": 7876 }, { "epoch": 1.46, "learning_rate": 1.0945378394096087e-05, "loss": 0.4475, "step": 7877 }, { "epoch": 1.46, "learning_rate": 1.094338986920652e-05, "loss": 0.4237, "step": 7878 }, { "epoch": 1.46, "learning_rate": 1.0941401306677441e-05, "loss": 0.4374, "step": 7879 }, { "epoch": 1.46, "learning_rate": 1.0939412706588197e-05, "loss": 0.4513, "step": 7880 }, { "epoch": 1.46, "learning_rate": 1.0937424069018124e-05, "loss": 0.4262, "step": 7881 }, { "epoch": 1.46, "learning_rate": 1.0935435394046567e-05, "loss": 0.4232, "step": 7882 }, { "epoch": 1.46, "learning_rate": 1.0933446681752869e-05, "loss": 0.4366, "step": 7883 }, { "epoch": 1.46, "learning_rate": 1.0931457932216377e-05, "loss": 0.423, "step": 7884 }, { "epoch": 1.46, "learning_rate": 1.0929469145516436e-05, "loss": 0.4402, "step": 7885 }, { "epoch": 1.46, "learning_rate": 1.0927480321732397e-05, "loss": 0.4505, "step": 7886 }, { "epoch": 1.46, "learning_rate": 1.0925491460943611e-05, "loss": 0.4333, "step": 7887 }, { "epoch": 1.46, "learning_rate": 1.092350256322943e-05, "loss": 0.4283, "step": 7888 }, { "epoch": 1.46, "learning_rate": 1.0921513628669206e-05, "loss": 0.4319, "step": 7889 }, { "epoch": 1.46, "learning_rate": 1.0919524657342296e-05, "loss": 0.4442, "step": 7890 }, { "epoch": 1.46, "learning_rate": 1.0917535649328053e-05, "loss": 0.4443, "step": 7891 }, { "epoch": 1.46, "learning_rate": 1.0915546604705835e-05, "loss": 0.4473, "step": 7892 }, { "epoch": 1.46, "learning_rate": 1.0913557523555008e-05, "loss": 0.4184, "step": 7893 }, { "epoch": 1.46, "learning_rate": 1.0911568405954922e-05, "loss": 0.4171, "step": 7894 }, { "epoch": 1.46, "learning_rate": 1.0909579251984945e-05, "loss": 0.4504, "step": 7895 }, { "epoch": 1.46, "learning_rate": 1.090759006172444e-05, "loss": 0.4199, "step": 7896 }, { "epoch": 1.46, "learning_rate": 1.0905600835252772e-05, "loss": 0.4279, "step": 7897 }, { "epoch": 1.46, "learning_rate": 1.0903611572649311e-05, "loss": 0.4254, "step": 7898 }, { "epoch": 1.46, "learning_rate": 1.0901622273993418e-05, "loss": 0.4363, "step": 7899 }, { "epoch": 1.46, "learning_rate": 1.0899632939364464e-05, "loss": 0.429, "step": 7900 }, { "epoch": 1.46, "learning_rate": 1.0897643568841825e-05, "loss": 0.4391, "step": 7901 }, { "epoch": 1.46, "learning_rate": 1.0895654162504866e-05, "loss": 0.4391, "step": 7902 }, { "epoch": 1.46, "learning_rate": 1.0893664720432965e-05, "loss": 0.4233, "step": 7903 }, { "epoch": 1.46, "learning_rate": 1.08916752427055e-05, "loss": 0.449, "step": 7904 }, { "epoch": 1.46, "learning_rate": 1.088968572940184e-05, "loss": 0.4303, "step": 7905 }, { "epoch": 1.46, "learning_rate": 1.0887696180601366e-05, "loss": 0.432, "step": 7906 }, { "epoch": 1.46, "learning_rate": 1.088570659638346e-05, "loss": 0.4339, "step": 7907 }, { "epoch": 1.46, "learning_rate": 1.0883716976827498e-05, "loss": 0.4338, "step": 7908 }, { "epoch": 1.46, "learning_rate": 1.0881727322012867e-05, "loss": 0.4266, "step": 7909 }, { "epoch": 1.46, "learning_rate": 1.087973763201895e-05, "loss": 0.4262, "step": 7910 }, { "epoch": 1.46, "learning_rate": 1.0877747906925127e-05, "loss": 0.4378, "step": 7911 }, { "epoch": 1.46, "learning_rate": 1.0875758146810788e-05, "loss": 0.4287, "step": 7912 }, { "epoch": 1.46, "learning_rate": 1.087376835175532e-05, "loss": 0.4581, "step": 7913 }, { "epoch": 1.46, "learning_rate": 1.0871778521838115e-05, "loss": 0.4348, "step": 7914 }, { "epoch": 1.46, "learning_rate": 1.0869788657138563e-05, "loss": 0.4388, "step": 7915 }, { "epoch": 1.46, "learning_rate": 1.086779875773605e-05, "loss": 0.4141, "step": 7916 }, { "epoch": 1.46, "learning_rate": 1.0865808823709973e-05, "loss": 0.4353, "step": 7917 }, { "epoch": 1.46, "learning_rate": 1.0863818855139727e-05, "loss": 0.4108, "step": 7918 }, { "epoch": 1.47, "learning_rate": 1.086182885210471e-05, "loss": 0.4372, "step": 7919 }, { "epoch": 1.47, "learning_rate": 1.0859838814684318e-05, "loss": 0.4466, "step": 7920 }, { "epoch": 1.47, "learning_rate": 1.0857848742957949e-05, "loss": 0.4307, "step": 7921 }, { "epoch": 1.47, "learning_rate": 1.0855858637005e-05, "loss": 0.4341, "step": 7922 }, { "epoch": 1.47, "learning_rate": 1.0853868496904877e-05, "loss": 0.4316, "step": 7923 }, { "epoch": 1.47, "learning_rate": 1.0851878322736983e-05, "loss": 0.4165, "step": 7924 }, { "epoch": 1.47, "learning_rate": 1.084988811458072e-05, "loss": 0.4369, "step": 7925 }, { "epoch": 1.47, "learning_rate": 1.0847897872515498e-05, "loss": 0.4346, "step": 7926 }, { "epoch": 1.47, "learning_rate": 1.0845907596620719e-05, "loss": 0.4318, "step": 7927 }, { "epoch": 1.47, "learning_rate": 1.0843917286975792e-05, "loss": 0.4521, "step": 7928 }, { "epoch": 1.47, "learning_rate": 1.0841926943660128e-05, "loss": 0.4151, "step": 7929 }, { "epoch": 1.47, "learning_rate": 1.0839936566753138e-05, "loss": 0.4359, "step": 7930 }, { "epoch": 1.47, "learning_rate": 1.0837946156334236e-05, "loss": 0.4575, "step": 7931 }, { "epoch": 1.47, "learning_rate": 1.083595571248283e-05, "loss": 0.4248, "step": 7932 }, { "epoch": 1.47, "learning_rate": 1.0833965235278344e-05, "loss": 0.4346, "step": 7933 }, { "epoch": 1.47, "learning_rate": 1.0831974724800184e-05, "loss": 0.4131, "step": 7934 }, { "epoch": 1.47, "learning_rate": 1.0829984181127775e-05, "loss": 0.4323, "step": 7935 }, { "epoch": 1.47, "learning_rate": 1.0827993604340531e-05, "loss": 0.4345, "step": 7936 }, { "epoch": 1.47, "learning_rate": 1.0826002994517878e-05, "loss": 0.4598, "step": 7937 }, { "epoch": 1.47, "learning_rate": 1.0824012351739235e-05, "loss": 0.4415, "step": 7938 }, { "epoch": 1.47, "learning_rate": 1.0822021676084024e-05, "loss": 0.4412, "step": 7939 }, { "epoch": 1.47, "learning_rate": 1.0820030967631669e-05, "loss": 0.4384, "step": 7940 }, { "epoch": 1.47, "learning_rate": 1.0818040226461599e-05, "loss": 0.4403, "step": 7941 }, { "epoch": 1.47, "learning_rate": 1.0816049452653238e-05, "loss": 0.4316, "step": 7942 }, { "epoch": 1.47, "learning_rate": 1.0814058646286014e-05, "loss": 0.4339, "step": 7943 }, { "epoch": 1.47, "learning_rate": 1.0812067807439359e-05, "loss": 0.4312, "step": 7944 }, { "epoch": 1.47, "learning_rate": 1.0810076936192699e-05, "loss": 0.4321, "step": 7945 }, { "epoch": 1.47, "learning_rate": 1.080808603262547e-05, "loss": 0.4238, "step": 7946 }, { "epoch": 1.47, "learning_rate": 1.0806095096817107e-05, "loss": 0.4122, "step": 7947 }, { "epoch": 1.47, "learning_rate": 1.080410412884704e-05, "loss": 0.4367, "step": 7948 }, { "epoch": 1.47, "learning_rate": 1.0802113128794707e-05, "loss": 0.4494, "step": 7949 }, { "epoch": 1.47, "learning_rate": 1.0800122096739545e-05, "loss": 0.4675, "step": 7950 }, { "epoch": 1.47, "learning_rate": 1.0798131032760992e-05, "loss": 0.4429, "step": 7951 }, { "epoch": 1.47, "learning_rate": 1.079613993693849e-05, "loss": 0.458, "step": 7952 }, { "epoch": 1.47, "learning_rate": 1.0794148809351479e-05, "loss": 0.4317, "step": 7953 }, { "epoch": 1.47, "learning_rate": 1.07921576500794e-05, "loss": 0.4153, "step": 7954 }, { "epoch": 1.47, "learning_rate": 1.0790166459201698e-05, "loss": 0.4088, "step": 7955 }, { "epoch": 1.47, "learning_rate": 1.0788175236797816e-05, "loss": 0.4502, "step": 7956 }, { "epoch": 1.47, "learning_rate": 1.07861839829472e-05, "loss": 0.4476, "step": 7957 }, { "epoch": 1.47, "learning_rate": 1.0784192697729301e-05, "loss": 0.434, "step": 7958 }, { "epoch": 1.47, "learning_rate": 1.0782201381223566e-05, "loss": 0.4412, "step": 7959 }, { "epoch": 1.47, "learning_rate": 1.0780210033509441e-05, "loss": 0.4342, "step": 7960 }, { "epoch": 1.47, "learning_rate": 1.0778218654666382e-05, "loss": 0.4292, "step": 7961 }, { "epoch": 1.47, "learning_rate": 1.077622724477384e-05, "loss": 0.4475, "step": 7962 }, { "epoch": 1.47, "learning_rate": 1.0774235803911266e-05, "loss": 0.4254, "step": 7963 }, { "epoch": 1.47, "learning_rate": 1.0772244332158121e-05, "loss": 0.4235, "step": 7964 }, { "epoch": 1.47, "learning_rate": 1.0770252829593855e-05, "loss": 0.4188, "step": 7965 }, { "epoch": 1.47, "learning_rate": 1.0768261296297925e-05, "loss": 0.4291, "step": 7966 }, { "epoch": 1.47, "learning_rate": 1.0766269732349795e-05, "loss": 0.4506, "step": 7967 }, { "epoch": 1.47, "learning_rate": 1.0764278137828918e-05, "loss": 0.4102, "step": 7968 }, { "epoch": 1.47, "learning_rate": 1.076228651281476e-05, "loss": 0.4135, "step": 7969 }, { "epoch": 1.47, "learning_rate": 1.0760294857386784e-05, "loss": 0.4182, "step": 7970 }, { "epoch": 1.47, "learning_rate": 1.0758303171624447e-05, "loss": 0.4303, "step": 7971 }, { "epoch": 1.47, "learning_rate": 1.0756311455607217e-05, "loss": 0.4254, "step": 7972 }, { "epoch": 1.48, "learning_rate": 1.0754319709414562e-05, "loss": 0.4483, "step": 7973 }, { "epoch": 1.48, "learning_rate": 1.0752327933125948e-05, "loss": 0.4423, "step": 7974 }, { "epoch": 1.48, "learning_rate": 1.0750336126820844e-05, "loss": 0.4407, "step": 7975 }, { "epoch": 1.48, "learning_rate": 1.0748344290578714e-05, "loss": 0.4448, "step": 7976 }, { "epoch": 1.48, "learning_rate": 1.0746352424479035e-05, "loss": 0.4472, "step": 7977 }, { "epoch": 1.48, "learning_rate": 1.0744360528601272e-05, "loss": 0.4345, "step": 7978 }, { "epoch": 1.48, "learning_rate": 1.0742368603024907e-05, "loss": 0.4598, "step": 7979 }, { "epoch": 1.48, "learning_rate": 1.0740376647829405e-05, "loss": 0.42, "step": 7980 }, { "epoch": 1.48, "learning_rate": 1.073838466309425e-05, "loss": 0.4354, "step": 7981 }, { "epoch": 1.48, "learning_rate": 1.073639264889891e-05, "loss": 0.4538, "step": 7982 }, { "epoch": 1.48, "learning_rate": 1.0734400605322868e-05, "loss": 0.4072, "step": 7983 }, { "epoch": 1.48, "learning_rate": 1.0732408532445601e-05, "loss": 0.4258, "step": 7984 }, { "epoch": 1.48, "learning_rate": 1.073041643034659e-05, "loss": 0.4426, "step": 7985 }, { "epoch": 1.48, "learning_rate": 1.0728424299105316e-05, "loss": 0.438, "step": 7986 }, { "epoch": 1.48, "learning_rate": 1.0726432138801262e-05, "loss": 0.4177, "step": 7987 }, { "epoch": 1.48, "learning_rate": 1.072443994951391e-05, "loss": 0.4311, "step": 7988 }, { "epoch": 1.48, "learning_rate": 1.0722447731322742e-05, "loss": 0.4233, "step": 7989 }, { "epoch": 1.48, "learning_rate": 1.0720455484307251e-05, "loss": 0.4458, "step": 7990 }, { "epoch": 1.48, "learning_rate": 1.071846320854692e-05, "loss": 0.4263, "step": 7991 }, { "epoch": 1.48, "learning_rate": 1.0716470904121236e-05, "loss": 0.4285, "step": 7992 }, { "epoch": 1.48, "learning_rate": 1.071447857110969e-05, "loss": 0.431, "step": 7993 }, { "epoch": 1.48, "learning_rate": 1.0712486209591772e-05, "loss": 0.4443, "step": 7994 }, { "epoch": 1.48, "learning_rate": 1.0710493819646972e-05, "loss": 0.4305, "step": 7995 }, { "epoch": 1.48, "learning_rate": 1.0708501401354785e-05, "loss": 0.4394, "step": 7996 }, { "epoch": 1.48, "learning_rate": 1.0706508954794705e-05, "loss": 0.4376, "step": 7997 }, { "epoch": 1.48, "learning_rate": 1.0704516480046225e-05, "loss": 0.4605, "step": 7998 }, { "epoch": 1.48, "learning_rate": 1.070252397718884e-05, "loss": 0.4335, "step": 7999 }, { "epoch": 1.48, "learning_rate": 1.0700531446302051e-05, "loss": 0.422, "step": 8000 }, { "epoch": 1.48, "learning_rate": 1.0698538887465355e-05, "loss": 0.4104, "step": 8001 }, { "epoch": 1.48, "learning_rate": 1.0696546300758248e-05, "loss": 0.4343, "step": 8002 }, { "epoch": 1.48, "learning_rate": 1.0694553686260238e-05, "loss": 0.4217, "step": 8003 }, { "epoch": 1.48, "learning_rate": 1.0692561044050817e-05, "loss": 0.4437, "step": 8004 }, { "epoch": 1.48, "learning_rate": 1.0690568374209493e-05, "loss": 0.4248, "step": 8005 }, { "epoch": 1.48, "learning_rate": 1.068857567681577e-05, "loss": 0.4484, "step": 8006 }, { "epoch": 1.48, "learning_rate": 1.0686582951949153e-05, "loss": 0.4151, "step": 8007 }, { "epoch": 1.48, "learning_rate": 1.0684590199689151e-05, "loss": 0.4334, "step": 8008 }, { "epoch": 1.48, "learning_rate": 1.0682597420115264e-05, "loss": 0.4456, "step": 8009 }, { "epoch": 1.48, "learning_rate": 1.0680604613307002e-05, "loss": 0.4289, "step": 8010 }, { "epoch": 1.48, "learning_rate": 1.0678611779343878e-05, "loss": 0.4423, "step": 8011 }, { "epoch": 1.48, "learning_rate": 1.06766189183054e-05, "loss": 0.4428, "step": 8012 }, { "epoch": 1.48, "learning_rate": 1.0674626030271078e-05, "loss": 0.4342, "step": 8013 }, { "epoch": 1.48, "learning_rate": 1.067263311532043e-05, "loss": 0.4301, "step": 8014 }, { "epoch": 1.48, "learning_rate": 1.0670640173532961e-05, "loss": 0.4372, "step": 8015 }, { "epoch": 1.48, "learning_rate": 1.0668647204988196e-05, "loss": 0.4418, "step": 8016 }, { "epoch": 1.48, "learning_rate": 1.0666654209765644e-05, "loss": 0.4322, "step": 8017 }, { "epoch": 1.48, "learning_rate": 1.0664661187944822e-05, "loss": 0.4231, "step": 8018 }, { "epoch": 1.48, "learning_rate": 1.0662668139605253e-05, "loss": 0.4082, "step": 8019 }, { "epoch": 1.48, "learning_rate": 1.0660675064826446e-05, "loss": 0.4281, "step": 8020 }, { "epoch": 1.48, "learning_rate": 1.065868196368793e-05, "loss": 0.4433, "step": 8021 }, { "epoch": 1.48, "learning_rate": 1.0656688836269225e-05, "loss": 0.4373, "step": 8022 }, { "epoch": 1.48, "learning_rate": 1.0654695682649849e-05, "loss": 0.4262, "step": 8023 }, { "epoch": 1.48, "learning_rate": 1.0652702502909328e-05, "loss": 0.4231, "step": 8024 }, { "epoch": 1.48, "learning_rate": 1.0650709297127188e-05, "loss": 0.4419, "step": 8025 }, { "epoch": 1.48, "learning_rate": 1.064871606538295e-05, "loss": 0.4152, "step": 8026 }, { "epoch": 1.49, "learning_rate": 1.064672280775614e-05, "loss": 0.4239, "step": 8027 }, { "epoch": 1.49, "learning_rate": 1.0644729524326289e-05, "loss": 0.4486, "step": 8028 }, { "epoch": 1.49, "learning_rate": 1.0642736215172924e-05, "loss": 0.4322, "step": 8029 }, { "epoch": 1.49, "learning_rate": 1.0640742880375574e-05, "loss": 0.4305, "step": 8030 }, { "epoch": 1.49, "learning_rate": 1.063874952001377e-05, "loss": 0.4291, "step": 8031 }, { "epoch": 1.49, "learning_rate": 1.0636756134167042e-05, "loss": 0.415, "step": 8032 }, { "epoch": 1.49, "learning_rate": 1.0634762722914922e-05, "loss": 0.4468, "step": 8033 }, { "epoch": 1.49, "learning_rate": 1.0632769286336946e-05, "loss": 0.409, "step": 8034 }, { "epoch": 1.49, "learning_rate": 1.0630775824512645e-05, "loss": 0.4144, "step": 8035 }, { "epoch": 1.49, "learning_rate": 1.0628782337521557e-05, "loss": 0.4267, "step": 8036 }, { "epoch": 1.49, "learning_rate": 1.062678882544322e-05, "loss": 0.4375, "step": 8037 }, { "epoch": 1.49, "learning_rate": 1.0624795288357168e-05, "loss": 0.4301, "step": 8038 }, { "epoch": 1.49, "learning_rate": 1.062280172634294e-05, "loss": 0.4338, "step": 8039 }, { "epoch": 1.49, "learning_rate": 1.0620808139480077e-05, "loss": 0.411, "step": 8040 }, { "epoch": 1.49, "learning_rate": 1.0618814527848121e-05, "loss": 0.4323, "step": 8041 }, { "epoch": 1.49, "learning_rate": 1.061682089152661e-05, "loss": 0.4247, "step": 8042 }, { "epoch": 1.49, "learning_rate": 1.0614827230595083e-05, "loss": 0.4213, "step": 8043 }, { "epoch": 1.49, "learning_rate": 1.0612833545133093e-05, "loss": 0.4224, "step": 8044 }, { "epoch": 1.49, "learning_rate": 1.0610839835220177e-05, "loss": 0.4276, "step": 8045 }, { "epoch": 1.49, "learning_rate": 1.0608846100935882e-05, "loss": 0.4457, "step": 8046 }, { "epoch": 1.49, "learning_rate": 1.0606852342359757e-05, "loss": 0.4401, "step": 8047 }, { "epoch": 1.49, "learning_rate": 1.0604858559571345e-05, "loss": 0.4256, "step": 8048 }, { "epoch": 1.49, "learning_rate": 1.0602864752650197e-05, "loss": 0.4354, "step": 8049 }, { "epoch": 1.49, "learning_rate": 1.060087092167586e-05, "loss": 0.4413, "step": 8050 }, { "epoch": 1.49, "learning_rate": 1.0598877066727888e-05, "loss": 0.4394, "step": 8051 }, { "epoch": 1.49, "learning_rate": 1.0596883187885832e-05, "loss": 0.4227, "step": 8052 }, { "epoch": 1.49, "learning_rate": 1.059488928522924e-05, "loss": 0.4428, "step": 8053 }, { "epoch": 1.49, "learning_rate": 1.0592895358837664e-05, "loss": 0.4567, "step": 8054 }, { "epoch": 1.49, "learning_rate": 1.0590901408790663e-05, "loss": 0.4244, "step": 8055 }, { "epoch": 1.49, "learning_rate": 1.058890743516779e-05, "loss": 0.4383, "step": 8056 }, { "epoch": 1.49, "learning_rate": 1.0586913438048599e-05, "loss": 0.4548, "step": 8057 }, { "epoch": 1.49, "learning_rate": 1.0584919417512651e-05, "loss": 0.4196, "step": 8058 }, { "epoch": 1.49, "learning_rate": 1.0582925373639501e-05, "loss": 0.4377, "step": 8059 }, { "epoch": 1.49, "learning_rate": 1.0580931306508706e-05, "loss": 0.4258, "step": 8060 }, { "epoch": 1.49, "learning_rate": 1.057893721619983e-05, "loss": 0.4405, "step": 8061 }, { "epoch": 1.49, "learning_rate": 1.0576943102792427e-05, "loss": 0.4494, "step": 8062 }, { "epoch": 1.49, "learning_rate": 1.0574948966366065e-05, "loss": 0.4332, "step": 8063 }, { "epoch": 1.49, "learning_rate": 1.0572954807000301e-05, "loss": 0.4197, "step": 8064 }, { "epoch": 1.49, "learning_rate": 1.0570960624774704e-05, "loss": 0.4397, "step": 8065 }, { "epoch": 1.49, "learning_rate": 1.0568966419768836e-05, "loss": 0.4665, "step": 8066 }, { "epoch": 1.49, "learning_rate": 1.056697219206226e-05, "loss": 0.4113, "step": 8067 }, { "epoch": 1.49, "learning_rate": 1.0564977941734543e-05, "loss": 0.4329, "step": 8068 }, { "epoch": 1.49, "learning_rate": 1.0562983668865253e-05, "loss": 0.4337, "step": 8069 }, { "epoch": 1.49, "learning_rate": 1.0560989373533957e-05, "loss": 0.4406, "step": 8070 }, { "epoch": 1.49, "learning_rate": 1.055899505582022e-05, "loss": 0.4488, "step": 8071 }, { "epoch": 1.49, "learning_rate": 1.0557000715803617e-05, "loss": 0.429, "step": 8072 }, { "epoch": 1.49, "learning_rate": 1.0555006353563718e-05, "loss": 0.449, "step": 8073 }, { "epoch": 1.49, "learning_rate": 1.0553011969180096e-05, "loss": 0.4525, "step": 8074 }, { "epoch": 1.49, "learning_rate": 1.0551017562732318e-05, "loss": 0.4316, "step": 8075 }, { "epoch": 1.49, "learning_rate": 1.0549023134299957e-05, "loss": 0.4604, "step": 8076 }, { "epoch": 1.49, "learning_rate": 1.054702868396259e-05, "loss": 0.4333, "step": 8077 }, { "epoch": 1.49, "learning_rate": 1.0545034211799792e-05, "loss": 0.4234, "step": 8078 }, { "epoch": 1.49, "learning_rate": 1.0543039717891138e-05, "loss": 0.4247, "step": 8079 }, { "epoch": 1.49, "learning_rate": 1.0541045202316207e-05, "loss": 0.448, "step": 8080 }, { "epoch": 1.5, "learning_rate": 1.0539050665154574e-05, "loss": 0.4307, "step": 8081 }, { "epoch": 1.5, "learning_rate": 1.0537056106485815e-05, "loss": 0.4401, "step": 8082 }, { "epoch": 1.5, "learning_rate": 1.053506152638951e-05, "loss": 0.4282, "step": 8083 }, { "epoch": 1.5, "learning_rate": 1.0533066924945243e-05, "loss": 0.4152, "step": 8084 }, { "epoch": 1.5, "learning_rate": 1.0531072302232592e-05, "loss": 0.4266, "step": 8085 }, { "epoch": 1.5, "learning_rate": 1.052907765833114e-05, "loss": 0.434, "step": 8086 }, { "epoch": 1.5, "learning_rate": 1.052708299332047e-05, "loss": 0.4201, "step": 8087 }, { "epoch": 1.5, "learning_rate": 1.0525088307280162e-05, "loss": 0.4355, "step": 8088 }, { "epoch": 1.5, "learning_rate": 1.0523093600289804e-05, "loss": 0.4308, "step": 8089 }, { "epoch": 1.5, "learning_rate": 1.0521098872428982e-05, "loss": 0.4356, "step": 8090 }, { "epoch": 1.5, "learning_rate": 1.0519104123777277e-05, "loss": 0.4401, "step": 8091 }, { "epoch": 1.5, "learning_rate": 1.0517109354414278e-05, "loss": 0.4219, "step": 8092 }, { "epoch": 1.5, "learning_rate": 1.0515114564419575e-05, "loss": 0.4262, "step": 8093 }, { "epoch": 1.5, "learning_rate": 1.0513119753872757e-05, "loss": 0.4353, "step": 8094 }, { "epoch": 1.5, "learning_rate": 1.0511124922853406e-05, "loss": 0.4233, "step": 8095 }, { "epoch": 1.5, "learning_rate": 1.050913007144112e-05, "loss": 0.4331, "step": 8096 }, { "epoch": 1.5, "learning_rate": 1.0507135199715485e-05, "loss": 0.4351, "step": 8097 }, { "epoch": 1.5, "learning_rate": 1.0505140307756096e-05, "loss": 0.4305, "step": 8098 }, { "epoch": 1.5, "learning_rate": 1.0503145395642543e-05, "loss": 0.4384, "step": 8099 }, { "epoch": 1.5, "learning_rate": 1.050115046345442e-05, "loss": 0.4006, "step": 8100 }, { "epoch": 1.5, "learning_rate": 1.0499155511271321e-05, "loss": 0.4149, "step": 8101 }, { "epoch": 1.5, "learning_rate": 1.0497160539172843e-05, "loss": 0.4534, "step": 8102 }, { "epoch": 1.5, "learning_rate": 1.049516554723858e-05, "loss": 0.4563, "step": 8103 }, { "epoch": 1.5, "learning_rate": 1.0493170535548127e-05, "loss": 0.4166, "step": 8104 }, { "epoch": 1.5, "learning_rate": 1.0491175504181082e-05, "loss": 0.438, "step": 8105 }, { "epoch": 1.5, "learning_rate": 1.0489180453217045e-05, "loss": 0.4197, "step": 8106 }, { "epoch": 1.5, "learning_rate": 1.0487185382735614e-05, "loss": 0.4332, "step": 8107 }, { "epoch": 1.5, "learning_rate": 1.0485190292816388e-05, "loss": 0.4308, "step": 8108 }, { "epoch": 1.5, "learning_rate": 1.0483195183538968e-05, "loss": 0.4384, "step": 8109 }, { "epoch": 1.5, "learning_rate": 1.0481200054982954e-05, "loss": 0.4501, "step": 8110 }, { "epoch": 1.5, "learning_rate": 1.0479204907227949e-05, "loss": 0.4268, "step": 8111 }, { "epoch": 1.5, "learning_rate": 1.0477209740353554e-05, "loss": 0.4251, "step": 8112 }, { "epoch": 1.5, "learning_rate": 1.0475214554439374e-05, "loss": 0.4188, "step": 8113 }, { "epoch": 1.5, "learning_rate": 1.0473219349565014e-05, "loss": 0.4362, "step": 8114 }, { "epoch": 1.5, "learning_rate": 1.0471224125810078e-05, "loss": 0.4154, "step": 8115 }, { "epoch": 1.5, "learning_rate": 1.0469228883254173e-05, "loss": 0.4261, "step": 8116 }, { "epoch": 1.5, "learning_rate": 1.0467233621976902e-05, "loss": 0.4235, "step": 8117 }, { "epoch": 1.5, "learning_rate": 1.046523834205788e-05, "loss": 0.4571, "step": 8118 }, { "epoch": 1.5, "learning_rate": 1.0463243043576704e-05, "loss": 0.426, "step": 8119 }, { "epoch": 1.5, "learning_rate": 1.0461247726612988e-05, "loss": 0.46, "step": 8120 }, { "epoch": 1.5, "learning_rate": 1.0459252391246343e-05, "loss": 0.4356, "step": 8121 }, { "epoch": 1.5, "learning_rate": 1.0457257037556378e-05, "loss": 0.4289, "step": 8122 }, { "epoch": 1.5, "learning_rate": 1.0455261665622705e-05, "loss": 0.4256, "step": 8123 }, { "epoch": 1.5, "learning_rate": 1.0453266275524936e-05, "loss": 0.441, "step": 8124 }, { "epoch": 1.5, "learning_rate": 1.045127086734268e-05, "loss": 0.4294, "step": 8125 }, { "epoch": 1.5, "learning_rate": 1.044927544115555e-05, "loss": 0.4217, "step": 8126 }, { "epoch": 1.5, "learning_rate": 1.0447279997043163e-05, "loss": 0.4176, "step": 8127 }, { "epoch": 1.5, "learning_rate": 1.0445284535085132e-05, "loss": 0.4288, "step": 8128 }, { "epoch": 1.5, "learning_rate": 1.0443289055361074e-05, "loss": 0.4307, "step": 8129 }, { "epoch": 1.5, "learning_rate": 1.0441293557950603e-05, "loss": 0.4183, "step": 8130 }, { "epoch": 1.5, "learning_rate": 1.0439298042933335e-05, "loss": 0.4306, "step": 8131 }, { "epoch": 1.5, "learning_rate": 1.0437302510388887e-05, "loss": 0.4155, "step": 8132 }, { "epoch": 1.5, "learning_rate": 1.043530696039688e-05, "loss": 0.445, "step": 8133 }, { "epoch": 1.5, "learning_rate": 1.043331139303693e-05, "loss": 0.4572, "step": 8134 }, { "epoch": 1.51, "learning_rate": 1.043131580838866e-05, "loss": 0.4361, "step": 8135 }, { "epoch": 1.51, "learning_rate": 1.0429320206531686e-05, "loss": 0.4233, "step": 8136 }, { "epoch": 1.51, "learning_rate": 1.042732458754563e-05, "loss": 0.421, "step": 8137 }, { "epoch": 1.51, "learning_rate": 1.0425328951510116e-05, "loss": 0.3932, "step": 8138 }, { "epoch": 1.51, "learning_rate": 1.0423333298504762e-05, "loss": 0.4286, "step": 8139 }, { "epoch": 1.51, "learning_rate": 1.0421337628609199e-05, "loss": 0.4448, "step": 8140 }, { "epoch": 1.51, "learning_rate": 1.041934194190304e-05, "loss": 0.4334, "step": 8141 }, { "epoch": 1.51, "learning_rate": 1.0417346238465916e-05, "loss": 0.4344, "step": 8142 }, { "epoch": 1.51, "learning_rate": 1.0415350518377447e-05, "loss": 0.4323, "step": 8143 }, { "epoch": 1.51, "learning_rate": 1.0413354781717263e-05, "loss": 0.4345, "step": 8144 }, { "epoch": 1.51, "learning_rate": 1.0411359028564986e-05, "loss": 0.4291, "step": 8145 }, { "epoch": 1.51, "learning_rate": 1.0409363259000252e-05, "loss": 0.435, "step": 8146 }, { "epoch": 1.51, "learning_rate": 1.0407367473102676e-05, "loss": 0.4196, "step": 8147 }, { "epoch": 1.51, "learning_rate": 1.0405371670951893e-05, "loss": 0.4306, "step": 8148 }, { "epoch": 1.51, "learning_rate": 1.0403375852627531e-05, "loss": 0.4154, "step": 8149 }, { "epoch": 1.51, "learning_rate": 1.040138001820922e-05, "loss": 0.4445, "step": 8150 }, { "epoch": 1.51, "learning_rate": 1.0399384167776592e-05, "loss": 0.4273, "step": 8151 }, { "epoch": 1.51, "learning_rate": 1.039738830140927e-05, "loss": 0.4318, "step": 8152 }, { "epoch": 1.51, "learning_rate": 1.0395392419186894e-05, "loss": 0.4334, "step": 8153 }, { "epoch": 1.51, "learning_rate": 1.039339652118909e-05, "loss": 0.4338, "step": 8154 }, { "epoch": 1.51, "learning_rate": 1.0391400607495494e-05, "loss": 0.4203, "step": 8155 }, { "epoch": 1.51, "learning_rate": 1.038940467818574e-05, "loss": 0.4368, "step": 8156 }, { "epoch": 1.51, "learning_rate": 1.0387408733339459e-05, "loss": 0.4315, "step": 8157 }, { "epoch": 1.51, "learning_rate": 1.0385412773036288e-05, "loss": 0.4764, "step": 8158 }, { "epoch": 1.51, "learning_rate": 1.0383416797355859e-05, "loss": 0.4555, "step": 8159 }, { "epoch": 1.51, "learning_rate": 1.038142080637781e-05, "loss": 0.4305, "step": 8160 }, { "epoch": 1.51, "learning_rate": 1.037942480018178e-05, "loss": 0.4249, "step": 8161 }, { "epoch": 1.51, "learning_rate": 1.0377428778847398e-05, "loss": 0.4195, "step": 8162 }, { "epoch": 1.51, "learning_rate": 1.037543274245431e-05, "loss": 0.4371, "step": 8163 }, { "epoch": 1.51, "learning_rate": 1.0373436691082149e-05, "loss": 0.4314, "step": 8164 }, { "epoch": 1.51, "learning_rate": 1.0371440624810557e-05, "loss": 0.4496, "step": 8165 }, { "epoch": 1.51, "learning_rate": 1.036944454371917e-05, "loss": 0.4164, "step": 8166 }, { "epoch": 1.51, "learning_rate": 1.0367448447887629e-05, "loss": 0.4306, "step": 8167 }, { "epoch": 1.51, "learning_rate": 1.0365452337395579e-05, "loss": 0.4264, "step": 8168 }, { "epoch": 1.51, "learning_rate": 1.0363456212322655e-05, "loss": 0.4526, "step": 8169 }, { "epoch": 1.51, "learning_rate": 1.0361460072748502e-05, "loss": 0.4291, "step": 8170 }, { "epoch": 1.51, "learning_rate": 1.0359463918752758e-05, "loss": 0.4246, "step": 8171 }, { "epoch": 1.51, "learning_rate": 1.0357467750415074e-05, "loss": 0.4451, "step": 8172 }, { "epoch": 1.51, "learning_rate": 1.0355471567815087e-05, "loss": 0.4378, "step": 8173 }, { "epoch": 1.51, "learning_rate": 1.0353475371032442e-05, "loss": 0.4551, "step": 8174 }, { "epoch": 1.51, "learning_rate": 1.0351479160146785e-05, "loss": 0.4417, "step": 8175 }, { "epoch": 1.51, "learning_rate": 1.0349482935237758e-05, "loss": 0.4303, "step": 8176 }, { "epoch": 1.51, "learning_rate": 1.0347486696385009e-05, "loss": 0.4321, "step": 8177 }, { "epoch": 1.51, "learning_rate": 1.0345490443668187e-05, "loss": 0.442, "step": 8178 }, { "epoch": 1.51, "learning_rate": 1.0343494177166935e-05, "loss": 0.4267, "step": 8179 }, { "epoch": 1.51, "learning_rate": 1.0341497896960902e-05, "loss": 0.4286, "step": 8180 }, { "epoch": 1.51, "learning_rate": 1.0339501603129731e-05, "loss": 0.4393, "step": 8181 }, { "epoch": 1.51, "learning_rate": 1.033750529575308e-05, "loss": 0.4358, "step": 8182 }, { "epoch": 1.51, "learning_rate": 1.0335508974910589e-05, "loss": 0.4537, "step": 8183 }, { "epoch": 1.51, "learning_rate": 1.0333512640681913e-05, "loss": 0.4221, "step": 8184 }, { "epoch": 1.51, "learning_rate": 1.03315162931467e-05, "loss": 0.4396, "step": 8185 }, { "epoch": 1.51, "learning_rate": 1.03295199323846e-05, "loss": 0.4539, "step": 8186 }, { "epoch": 1.51, "learning_rate": 1.0327523558475263e-05, "loss": 0.4184, "step": 8187 }, { "epoch": 1.51, "learning_rate": 1.0325527171498344e-05, "loss": 0.4586, "step": 8188 }, { "epoch": 1.52, "learning_rate": 1.0323530771533495e-05, "loss": 0.417, "step": 8189 }, { "epoch": 1.52, "learning_rate": 1.0321534358660363e-05, "loss": 0.433, "step": 8190 }, { "epoch": 1.52, "learning_rate": 1.031953793295861e-05, "loss": 0.4289, "step": 8191 }, { "epoch": 1.52, "learning_rate": 1.0317541494507883e-05, "loss": 0.4412, "step": 8192 }, { "epoch": 1.52, "learning_rate": 1.0315545043387838e-05, "loss": 0.4426, "step": 8193 }, { "epoch": 1.52, "learning_rate": 1.031354857967813e-05, "loss": 0.44, "step": 8194 }, { "epoch": 1.52, "learning_rate": 1.0311552103458417e-05, "loss": 0.4243, "step": 8195 }, { "epoch": 1.52, "learning_rate": 1.0309555614808349e-05, "loss": 0.4523, "step": 8196 }, { "epoch": 1.52, "learning_rate": 1.0307559113807586e-05, "loss": 0.4275, "step": 8197 }, { "epoch": 1.52, "learning_rate": 1.0305562600535783e-05, "loss": 0.4575, "step": 8198 }, { "epoch": 1.52, "learning_rate": 1.0303566075072599e-05, "loss": 0.4274, "step": 8199 }, { "epoch": 1.52, "learning_rate": 1.030156953749769e-05, "loss": 0.4512, "step": 8200 }, { "epoch": 1.52, "learning_rate": 1.0299572987890715e-05, "loss": 0.4171, "step": 8201 }, { "epoch": 1.52, "learning_rate": 1.0297576426331336e-05, "loss": 0.4342, "step": 8202 }, { "epoch": 1.52, "learning_rate": 1.0295579852899202e-05, "loss": 0.4141, "step": 8203 }, { "epoch": 1.52, "learning_rate": 1.0293583267673983e-05, "loss": 0.4429, "step": 8204 }, { "epoch": 1.52, "learning_rate": 1.0291586670735335e-05, "loss": 0.4483, "step": 8205 }, { "epoch": 1.52, "learning_rate": 1.0289590062162918e-05, "loss": 0.4218, "step": 8206 }, { "epoch": 1.52, "learning_rate": 1.0287593442036394e-05, "loss": 0.4201, "step": 8207 }, { "epoch": 1.52, "learning_rate": 1.0285596810435423e-05, "loss": 0.4421, "step": 8208 }, { "epoch": 1.52, "learning_rate": 1.028360016743967e-05, "loss": 0.4448, "step": 8209 }, { "epoch": 1.52, "learning_rate": 1.0281603513128793e-05, "loss": 0.4179, "step": 8210 }, { "epoch": 1.52, "learning_rate": 1.0279606847582457e-05, "loss": 0.4343, "step": 8211 }, { "epoch": 1.52, "learning_rate": 1.0277610170880327e-05, "loss": 0.4396, "step": 8212 }, { "epoch": 1.52, "learning_rate": 1.0275613483102064e-05, "loss": 0.4432, "step": 8213 }, { "epoch": 1.52, "learning_rate": 1.0273616784327337e-05, "loss": 0.4068, "step": 8214 }, { "epoch": 1.52, "learning_rate": 1.0271620074635801e-05, "loss": 0.4382, "step": 8215 }, { "epoch": 1.52, "learning_rate": 1.0269623354107132e-05, "loss": 0.4267, "step": 8216 }, { "epoch": 1.52, "learning_rate": 1.026762662282099e-05, "loss": 0.4387, "step": 8217 }, { "epoch": 1.52, "learning_rate": 1.026562988085704e-05, "loss": 0.4156, "step": 8218 }, { "epoch": 1.52, "learning_rate": 1.0263633128294947e-05, "loss": 0.4319, "step": 8219 }, { "epoch": 1.52, "learning_rate": 1.0261636365214385e-05, "loss": 0.4501, "step": 8220 }, { "epoch": 1.52, "learning_rate": 1.0259639591695012e-05, "loss": 0.4259, "step": 8221 }, { "epoch": 1.52, "learning_rate": 1.0257642807816504e-05, "loss": 0.4231, "step": 8222 }, { "epoch": 1.52, "learning_rate": 1.0255646013658523e-05, "loss": 0.4304, "step": 8223 }, { "epoch": 1.52, "learning_rate": 1.025364920930074e-05, "loss": 0.4179, "step": 8224 }, { "epoch": 1.52, "learning_rate": 1.0251652394822822e-05, "loss": 0.4359, "step": 8225 }, { "epoch": 1.52, "learning_rate": 1.024965557030444e-05, "loss": 0.4404, "step": 8226 }, { "epoch": 1.52, "learning_rate": 1.0247658735825262e-05, "loss": 0.4396, "step": 8227 }, { "epoch": 1.52, "learning_rate": 1.0245661891464963e-05, "loss": 0.4296, "step": 8228 }, { "epoch": 1.52, "learning_rate": 1.0243665037303205e-05, "loss": 0.4352, "step": 8229 }, { "epoch": 1.52, "learning_rate": 1.0241668173419664e-05, "loss": 0.4315, "step": 8230 }, { "epoch": 1.52, "learning_rate": 1.0239671299894009e-05, "loss": 0.4065, "step": 8231 }, { "epoch": 1.52, "learning_rate": 1.0237674416805917e-05, "loss": 0.4264, "step": 8232 }, { "epoch": 1.52, "learning_rate": 1.0235677524235055e-05, "loss": 0.4205, "step": 8233 }, { "epoch": 1.52, "learning_rate": 1.0233680622261093e-05, "loss": 0.423, "step": 8234 }, { "epoch": 1.52, "learning_rate": 1.0231683710963709e-05, "loss": 0.4289, "step": 8235 }, { "epoch": 1.52, "learning_rate": 1.0229686790422572e-05, "loss": 0.4286, "step": 8236 }, { "epoch": 1.52, "learning_rate": 1.0227689860717358e-05, "loss": 0.4054, "step": 8237 }, { "epoch": 1.52, "learning_rate": 1.0225692921927742e-05, "loss": 0.424, "step": 8238 }, { "epoch": 1.52, "learning_rate": 1.0223695974133393e-05, "loss": 0.4393, "step": 8239 }, { "epoch": 1.52, "learning_rate": 1.022169901741399e-05, "loss": 0.4235, "step": 8240 }, { "epoch": 1.52, "learning_rate": 1.0219702051849208e-05, "loss": 0.4553, "step": 8241 }, { "epoch": 1.52, "learning_rate": 1.021770507751872e-05, "loss": 0.4121, "step": 8242 }, { "epoch": 1.53, "learning_rate": 1.0215708094502204e-05, "loss": 0.4358, "step": 8243 }, { "epoch": 1.53, "learning_rate": 1.0213711102879333e-05, "loss": 0.4383, "step": 8244 }, { "epoch": 1.53, "learning_rate": 1.0211714102729786e-05, "loss": 0.4426, "step": 8245 }, { "epoch": 1.53, "learning_rate": 1.0209717094133236e-05, "loss": 0.4424, "step": 8246 }, { "epoch": 1.53, "learning_rate": 1.0207720077169364e-05, "loss": 0.4093, "step": 8247 }, { "epoch": 1.53, "learning_rate": 1.0205723051917843e-05, "loss": 0.4258, "step": 8248 }, { "epoch": 1.53, "learning_rate": 1.0203726018458355e-05, "loss": 0.4496, "step": 8249 }, { "epoch": 1.53, "learning_rate": 1.0201728976870578e-05, "loss": 0.4207, "step": 8250 }, { "epoch": 1.53, "learning_rate": 1.0199731927234187e-05, "loss": 0.4162, "step": 8251 }, { "epoch": 1.53, "learning_rate": 1.0197734869628861e-05, "loss": 0.4569, "step": 8252 }, { "epoch": 1.53, "learning_rate": 1.019573780413428e-05, "loss": 0.4285, "step": 8253 }, { "epoch": 1.53, "learning_rate": 1.0193740730830122e-05, "loss": 0.4441, "step": 8254 }, { "epoch": 1.53, "learning_rate": 1.019174364979607e-05, "loss": 0.4467, "step": 8255 }, { "epoch": 1.53, "learning_rate": 1.01897465611118e-05, "loss": 0.4265, "step": 8256 }, { "epoch": 1.53, "learning_rate": 1.0187749464856994e-05, "loss": 0.4469, "step": 8257 }, { "epoch": 1.53, "learning_rate": 1.018575236111133e-05, "loss": 0.431, "step": 8258 }, { "epoch": 1.53, "learning_rate": 1.0183755249954492e-05, "loss": 0.4467, "step": 8259 }, { "epoch": 1.53, "learning_rate": 1.0181758131466159e-05, "loss": 0.4409, "step": 8260 }, { "epoch": 1.53, "learning_rate": 1.0179761005726014e-05, "loss": 0.4318, "step": 8261 }, { "epoch": 1.53, "learning_rate": 1.0177763872813737e-05, "loss": 0.4502, "step": 8262 }, { "epoch": 1.53, "learning_rate": 1.0175766732809011e-05, "loss": 0.4347, "step": 8263 }, { "epoch": 1.53, "learning_rate": 1.017376958579152e-05, "loss": 0.443, "step": 8264 }, { "epoch": 1.53, "learning_rate": 1.017177243184094e-05, "loss": 0.4319, "step": 8265 }, { "epoch": 1.53, "learning_rate": 1.0169775271036964e-05, "loss": 0.4447, "step": 8266 }, { "epoch": 1.53, "learning_rate": 1.0167778103459265e-05, "loss": 0.4273, "step": 8267 }, { "epoch": 1.53, "learning_rate": 1.016578092918753e-05, "loss": 0.4371, "step": 8268 }, { "epoch": 1.53, "learning_rate": 1.0163783748301443e-05, "loss": 0.451, "step": 8269 }, { "epoch": 1.53, "learning_rate": 1.0161786560880686e-05, "loss": 0.4473, "step": 8270 }, { "epoch": 1.53, "learning_rate": 1.0159789367004948e-05, "loss": 0.4345, "step": 8271 }, { "epoch": 1.53, "learning_rate": 1.015779216675391e-05, "loss": 0.4485, "step": 8272 }, { "epoch": 1.53, "learning_rate": 1.0155794960207258e-05, "loss": 0.4448, "step": 8273 }, { "epoch": 1.53, "learning_rate": 1.015379774744467e-05, "loss": 0.4457, "step": 8274 }, { "epoch": 1.53, "learning_rate": 1.0151800528545842e-05, "loss": 0.4393, "step": 8275 }, { "epoch": 1.53, "learning_rate": 1.0149803303590451e-05, "loss": 0.4373, "step": 8276 }, { "epoch": 1.53, "learning_rate": 1.0147806072658189e-05, "loss": 0.4309, "step": 8277 }, { "epoch": 1.53, "learning_rate": 1.0145808835828735e-05, "loss": 0.4396, "step": 8278 }, { "epoch": 1.53, "learning_rate": 1.0143811593181779e-05, "loss": 0.4309, "step": 8279 }, { "epoch": 1.53, "learning_rate": 1.0141814344797006e-05, "loss": 0.437, "step": 8280 }, { "epoch": 1.53, "learning_rate": 1.0139817090754102e-05, "loss": 0.4136, "step": 8281 }, { "epoch": 1.53, "learning_rate": 1.0137819831132758e-05, "loss": 0.4363, "step": 8282 }, { "epoch": 1.53, "learning_rate": 1.013582256601266e-05, "loss": 0.4206, "step": 8283 }, { "epoch": 1.53, "learning_rate": 1.0133825295473487e-05, "loss": 0.4318, "step": 8284 }, { "epoch": 1.53, "learning_rate": 1.0131828019594937e-05, "loss": 0.4495, "step": 8285 }, { "epoch": 1.53, "learning_rate": 1.0129830738456689e-05, "loss": 0.437, "step": 8286 }, { "epoch": 1.53, "learning_rate": 1.0127833452138439e-05, "loss": 0.4285, "step": 8287 }, { "epoch": 1.53, "learning_rate": 1.0125836160719869e-05, "loss": 0.458, "step": 8288 }, { "epoch": 1.53, "learning_rate": 1.0123838864280668e-05, "loss": 0.4226, "step": 8289 }, { "epoch": 1.53, "learning_rate": 1.0121841562900528e-05, "loss": 0.4365, "step": 8290 }, { "epoch": 1.53, "learning_rate": 1.0119844256659134e-05, "loss": 0.4232, "step": 8291 }, { "epoch": 1.53, "learning_rate": 1.0117846945636175e-05, "loss": 0.451, "step": 8292 }, { "epoch": 1.53, "learning_rate": 1.0115849629911343e-05, "loss": 0.4225, "step": 8293 }, { "epoch": 1.53, "learning_rate": 1.0113852309564327e-05, "loss": 0.4147, "step": 8294 }, { "epoch": 1.53, "learning_rate": 1.0111854984674812e-05, "loss": 0.4426, "step": 8295 }, { "epoch": 1.53, "learning_rate": 1.010985765532249e-05, "loss": 0.4046, "step": 8296 }, { "epoch": 1.54, "learning_rate": 1.010786032158705e-05, "loss": 0.4353, "step": 8297 }, { "epoch": 1.54, "learning_rate": 1.0105862983548185e-05, "loss": 0.4306, "step": 8298 }, { "epoch": 1.54, "learning_rate": 1.0103865641285584e-05, "loss": 0.4141, "step": 8299 }, { "epoch": 1.54, "learning_rate": 1.0101868294878937e-05, "loss": 0.4329, "step": 8300 }, { "epoch": 1.54, "learning_rate": 1.009987094440793e-05, "loss": 0.4252, "step": 8301 }, { "epoch": 1.54, "learning_rate": 1.0097873589952256e-05, "loss": 0.444, "step": 8302 }, { "epoch": 1.54, "learning_rate": 1.009587623159161e-05, "loss": 0.4374, "step": 8303 }, { "epoch": 1.54, "learning_rate": 1.009387886940568e-05, "loss": 0.4347, "step": 8304 }, { "epoch": 1.54, "learning_rate": 1.0091881503474157e-05, "loss": 0.4405, "step": 8305 }, { "epoch": 1.54, "learning_rate": 1.0089884133876731e-05, "loss": 0.4329, "step": 8306 }, { "epoch": 1.54, "learning_rate": 1.0087886760693096e-05, "loss": 0.4251, "step": 8307 }, { "epoch": 1.54, "learning_rate": 1.008588938400294e-05, "loss": 0.424, "step": 8308 }, { "epoch": 1.54, "learning_rate": 1.0083892003885955e-05, "loss": 0.4336, "step": 8309 }, { "epoch": 1.54, "learning_rate": 1.008189462042184e-05, "loss": 0.4482, "step": 8310 }, { "epoch": 1.54, "learning_rate": 1.0079897233690276e-05, "loss": 0.4558, "step": 8311 }, { "epoch": 1.54, "learning_rate": 1.0077899843770964e-05, "loss": 0.4283, "step": 8312 }, { "epoch": 1.54, "learning_rate": 1.007590245074359e-05, "loss": 0.4056, "step": 8313 }, { "epoch": 1.54, "learning_rate": 1.007390505468785e-05, "loss": 0.4126, "step": 8314 }, { "epoch": 1.54, "learning_rate": 1.0071907655683432e-05, "loss": 0.4367, "step": 8315 }, { "epoch": 1.54, "learning_rate": 1.0069910253810035e-05, "loss": 0.4263, "step": 8316 }, { "epoch": 1.54, "learning_rate": 1.0067912849147348e-05, "loss": 0.4248, "step": 8317 }, { "epoch": 1.54, "learning_rate": 1.0065915441775062e-05, "loss": 0.4252, "step": 8318 }, { "epoch": 1.54, "learning_rate": 1.0063918031772875e-05, "loss": 0.4414, "step": 8319 }, { "epoch": 1.54, "learning_rate": 1.0061920619220476e-05, "loss": 0.4244, "step": 8320 }, { "epoch": 1.54, "learning_rate": 1.005992320419756e-05, "loss": 0.4391, "step": 8321 }, { "epoch": 1.54, "learning_rate": 1.0057925786783815e-05, "loss": 0.4159, "step": 8322 }, { "epoch": 1.54, "learning_rate": 1.0055928367058942e-05, "loss": 0.4609, "step": 8323 }, { "epoch": 1.54, "learning_rate": 1.005393094510263e-05, "loss": 0.4312, "step": 8324 }, { "epoch": 1.54, "learning_rate": 1.0051933520994572e-05, "loss": 0.4451, "step": 8325 }, { "epoch": 1.54, "learning_rate": 1.0049936094814463e-05, "loss": 0.4431, "step": 8326 }, { "epoch": 1.54, "learning_rate": 1.0047938666641999e-05, "loss": 0.4467, "step": 8327 }, { "epoch": 1.54, "learning_rate": 1.0045941236556866e-05, "loss": 0.4291, "step": 8328 }, { "epoch": 1.54, "learning_rate": 1.0043943804638767e-05, "loss": 0.4415, "step": 8329 }, { "epoch": 1.54, "learning_rate": 1.0041946370967389e-05, "loss": 0.4224, "step": 8330 }, { "epoch": 1.54, "learning_rate": 1.003994893562243e-05, "loss": 0.4281, "step": 8331 }, { "epoch": 1.54, "learning_rate": 1.0037951498683582e-05, "loss": 0.4245, "step": 8332 }, { "epoch": 1.54, "learning_rate": 1.0035954060230539e-05, "loss": 0.4394, "step": 8333 }, { "epoch": 1.54, "learning_rate": 1.0033956620342997e-05, "loss": 0.4457, "step": 8334 }, { "epoch": 1.54, "learning_rate": 1.0031959179100645e-05, "loss": 0.4379, "step": 8335 }, { "epoch": 1.54, "learning_rate": 1.0029961736583185e-05, "loss": 0.448, "step": 8336 }, { "epoch": 1.54, "learning_rate": 1.0027964292870304e-05, "loss": 0.4316, "step": 8337 }, { "epoch": 1.54, "learning_rate": 1.0025966848041701e-05, "loss": 0.4216, "step": 8338 }, { "epoch": 1.54, "learning_rate": 1.0023969402177069e-05, "loss": 0.4373, "step": 8339 }, { "epoch": 1.54, "learning_rate": 1.0021971955356102e-05, "loss": 0.426, "step": 8340 }, { "epoch": 1.54, "learning_rate": 1.0019974507658495e-05, "loss": 0.4253, "step": 8341 }, { "epoch": 1.54, "learning_rate": 1.0017977059163942e-05, "loss": 0.4371, "step": 8342 }, { "epoch": 1.54, "learning_rate": 1.001597960995214e-05, "loss": 0.4373, "step": 8343 }, { "epoch": 1.54, "learning_rate": 1.0013982160102778e-05, "loss": 0.4191, "step": 8344 }, { "epoch": 1.54, "learning_rate": 1.0011984709695553e-05, "loss": 0.424, "step": 8345 }, { "epoch": 1.54, "learning_rate": 1.0009987258810162e-05, "loss": 0.4374, "step": 8346 }, { "epoch": 1.54, "learning_rate": 1.0007989807526297e-05, "loss": 0.4181, "step": 8347 }, { "epoch": 1.54, "learning_rate": 1.0005992355923655e-05, "loss": 0.4211, "step": 8348 }, { "epoch": 1.54, "learning_rate": 1.0003994904081929e-05, "loss": 0.4401, "step": 8349 }, { "epoch": 1.54, "learning_rate": 1.0001997452080812e-05, "loss": 0.4182, "step": 8350 }, { "epoch": 1.55, "learning_rate": 1e-05, "loss": 0.4533, "step": 8351 }, { "epoch": 1.55, "learning_rate": 9.998002547919192e-06, "loss": 0.4097, "step": 8352 }, { "epoch": 1.55, "learning_rate": 9.996005095918074e-06, "loss": 0.4288, "step": 8353 }, { "epoch": 1.55, "learning_rate": 9.994007644076349e-06, "loss": 0.4053, "step": 8354 }, { "epoch": 1.55, "learning_rate": 9.992010192473703e-06, "loss": 0.4355, "step": 8355 }, { "epoch": 1.55, "learning_rate": 9.99001274118984e-06, "loss": 0.4238, "step": 8356 }, { "epoch": 1.55, "learning_rate": 9.988015290304452e-06, "loss": 0.4231, "step": 8357 }, { "epoch": 1.55, "learning_rate": 9.986017839897225e-06, "loss": 0.4263, "step": 8358 }, { "epoch": 1.55, "learning_rate": 9.984020390047867e-06, "loss": 0.4387, "step": 8359 }, { "epoch": 1.55, "learning_rate": 9.98202294083606e-06, "loss": 0.4106, "step": 8360 }, { "epoch": 1.55, "learning_rate": 9.980025492341508e-06, "loss": 0.4352, "step": 8361 }, { "epoch": 1.55, "learning_rate": 9.9780280446439e-06, "loss": 0.447, "step": 8362 }, { "epoch": 1.55, "learning_rate": 9.976030597822933e-06, "loss": 0.4381, "step": 8363 }, { "epoch": 1.55, "learning_rate": 9.974033151958302e-06, "loss": 0.4273, "step": 8364 }, { "epoch": 1.55, "learning_rate": 9.972035707129697e-06, "loss": 0.4392, "step": 8365 }, { "epoch": 1.55, "learning_rate": 9.970038263416818e-06, "loss": 0.4232, "step": 8366 }, { "epoch": 1.55, "learning_rate": 9.968040820899356e-06, "loss": 0.4442, "step": 8367 }, { "epoch": 1.55, "learning_rate": 9.966043379657006e-06, "loss": 0.428, "step": 8368 }, { "epoch": 1.55, "learning_rate": 9.964045939769465e-06, "loss": 0.4597, "step": 8369 }, { "epoch": 1.55, "learning_rate": 9.96204850131642e-06, "loss": 0.4104, "step": 8370 }, { "epoch": 1.55, "learning_rate": 9.960051064377574e-06, "loss": 0.4322, "step": 8371 }, { "epoch": 1.55, "learning_rate": 9.958053629032611e-06, "loss": 0.4318, "step": 8372 }, { "epoch": 1.55, "learning_rate": 9.956056195361237e-06, "loss": 0.4275, "step": 8373 }, { "epoch": 1.55, "learning_rate": 9.954058763443137e-06, "loss": 0.4469, "step": 8374 }, { "epoch": 1.55, "learning_rate": 9.952061333358005e-06, "loss": 0.4281, "step": 8375 }, { "epoch": 1.55, "learning_rate": 9.950063905185539e-06, "loss": 0.4463, "step": 8376 }, { "epoch": 1.55, "learning_rate": 9.94806647900543e-06, "loss": 0.4241, "step": 8377 }, { "epoch": 1.55, "learning_rate": 9.946069054897374e-06, "loss": 0.4463, "step": 8378 }, { "epoch": 1.55, "learning_rate": 9.944071632941064e-06, "loss": 0.4505, "step": 8379 }, { "epoch": 1.55, "learning_rate": 9.942074213216187e-06, "loss": 0.4198, "step": 8380 }, { "epoch": 1.55, "learning_rate": 9.940076795802446e-06, "loss": 0.4378, "step": 8381 }, { "epoch": 1.55, "learning_rate": 9.938079380779526e-06, "loss": 0.4463, "step": 8382 }, { "epoch": 1.55, "learning_rate": 9.936081968227129e-06, "loss": 0.4302, "step": 8383 }, { "epoch": 1.55, "learning_rate": 9.93408455822494e-06, "loss": 0.4515, "step": 8384 }, { "epoch": 1.55, "learning_rate": 9.932087150852655e-06, "loss": 0.4421, "step": 8385 }, { "epoch": 1.55, "learning_rate": 9.930089746189966e-06, "loss": 0.4181, "step": 8386 }, { "epoch": 1.55, "learning_rate": 9.92809234431657e-06, "loss": 0.4125, "step": 8387 }, { "epoch": 1.55, "learning_rate": 9.926094945312154e-06, "loss": 0.4152, "step": 8388 }, { "epoch": 1.55, "learning_rate": 9.924097549256413e-06, "loss": 0.4137, "step": 8389 }, { "epoch": 1.55, "learning_rate": 9.922100156229038e-06, "loss": 0.4481, "step": 8390 }, { "epoch": 1.55, "learning_rate": 9.920102766309727e-06, "loss": 0.4394, "step": 8391 }, { "epoch": 1.55, "learning_rate": 9.918105379578162e-06, "loss": 0.4562, "step": 8392 }, { "epoch": 1.55, "learning_rate": 9.916107996114047e-06, "loss": 0.4319, "step": 8393 }, { "epoch": 1.55, "learning_rate": 9.914110615997062e-06, "loss": 0.4311, "step": 8394 }, { "epoch": 1.55, "learning_rate": 9.912113239306908e-06, "loss": 0.4422, "step": 8395 }, { "epoch": 1.55, "learning_rate": 9.910115866123274e-06, "loss": 0.4264, "step": 8396 }, { "epoch": 1.55, "learning_rate": 9.908118496525845e-06, "loss": 0.4151, "step": 8397 }, { "epoch": 1.55, "learning_rate": 9.906121130594324e-06, "loss": 0.4338, "step": 8398 }, { "epoch": 1.55, "learning_rate": 9.90412376840839e-06, "loss": 0.4168, "step": 8399 }, { "epoch": 1.55, "learning_rate": 9.902126410047746e-06, "loss": 0.4346, "step": 8400 }, { "epoch": 1.55, "learning_rate": 9.900129055592076e-06, "loss": 0.4457, "step": 8401 }, { "epoch": 1.55, "learning_rate": 9.898131705121068e-06, "loss": 0.4245, "step": 8402 }, { "epoch": 1.55, "learning_rate": 9.89613435871442e-06, "loss": 0.4382, "step": 8403 }, { "epoch": 1.55, "learning_rate": 9.894137016451814e-06, "loss": 0.4388, "step": 8404 }, { "epoch": 1.56, "learning_rate": 9.892139678412951e-06, "loss": 0.426, "step": 8405 }, { "epoch": 1.56, "learning_rate": 9.890142344677515e-06, "loss": 0.4278, "step": 8406 }, { "epoch": 1.56, "learning_rate": 9.888145015325192e-06, "loss": 0.4434, "step": 8407 }, { "epoch": 1.56, "learning_rate": 9.886147690435678e-06, "loss": 0.4357, "step": 8408 }, { "epoch": 1.56, "learning_rate": 9.884150370088658e-06, "loss": 0.4225, "step": 8409 }, { "epoch": 1.56, "learning_rate": 9.882153054363826e-06, "loss": 0.4277, "step": 8410 }, { "epoch": 1.56, "learning_rate": 9.880155743340867e-06, "loss": 0.4388, "step": 8411 }, { "epoch": 1.56, "learning_rate": 9.878158437099475e-06, "loss": 0.4503, "step": 8412 }, { "epoch": 1.56, "learning_rate": 9.876161135719334e-06, "loss": 0.4499, "step": 8413 }, { "epoch": 1.56, "learning_rate": 9.874163839280134e-06, "loss": 0.4352, "step": 8414 }, { "epoch": 1.56, "learning_rate": 9.872166547861563e-06, "loss": 0.4022, "step": 8415 }, { "epoch": 1.56, "learning_rate": 9.870169261543313e-06, "loss": 0.419, "step": 8416 }, { "epoch": 1.56, "learning_rate": 9.868171980405067e-06, "loss": 0.4173, "step": 8417 }, { "epoch": 1.56, "learning_rate": 9.866174704526516e-06, "loss": 0.4408, "step": 8418 }, { "epoch": 1.56, "learning_rate": 9.864177433987344e-06, "loss": 0.4529, "step": 8419 }, { "epoch": 1.56, "learning_rate": 9.862180168867245e-06, "loss": 0.4409, "step": 8420 }, { "epoch": 1.56, "learning_rate": 9.860182909245898e-06, "loss": 0.452, "step": 8421 }, { "epoch": 1.56, "learning_rate": 9.858185655202997e-06, "loss": 0.4245, "step": 8422 }, { "epoch": 1.56, "learning_rate": 9.856188406818226e-06, "loss": 0.4513, "step": 8423 }, { "epoch": 1.56, "learning_rate": 9.854191164171269e-06, "loss": 0.4402, "step": 8424 }, { "epoch": 1.56, "learning_rate": 9.852193927341818e-06, "loss": 0.4582, "step": 8425 }, { "epoch": 1.56, "learning_rate": 9.85019669640955e-06, "loss": 0.4286, "step": 8426 }, { "epoch": 1.56, "learning_rate": 9.848199471454162e-06, "loss": 0.4299, "step": 8427 }, { "epoch": 1.56, "learning_rate": 9.846202252555334e-06, "loss": 0.4161, "step": 8428 }, { "epoch": 1.56, "learning_rate": 9.844205039792747e-06, "loss": 0.4384, "step": 8429 }, { "epoch": 1.56, "learning_rate": 9.842207833246095e-06, "loss": 0.444, "step": 8430 }, { "epoch": 1.56, "learning_rate": 9.840210632995054e-06, "loss": 0.4109, "step": 8431 }, { "epoch": 1.56, "learning_rate": 9.838213439119316e-06, "loss": 0.4342, "step": 8432 }, { "epoch": 1.56, "learning_rate": 9.836216251698559e-06, "loss": 0.4167, "step": 8433 }, { "epoch": 1.56, "learning_rate": 9.834219070812475e-06, "loss": 0.431, "step": 8434 }, { "epoch": 1.56, "learning_rate": 9.832221896540742e-06, "loss": 0.4348, "step": 8435 }, { "epoch": 1.56, "learning_rate": 9.830224728963041e-06, "loss": 0.4437, "step": 8436 }, { "epoch": 1.56, "learning_rate": 9.828227568159063e-06, "loss": 0.4142, "step": 8437 }, { "epoch": 1.56, "learning_rate": 9.826230414208482e-06, "loss": 0.439, "step": 8438 }, { "epoch": 1.56, "learning_rate": 9.824233267190992e-06, "loss": 0.422, "step": 8439 }, { "epoch": 1.56, "learning_rate": 9.822236127186265e-06, "loss": 0.4271, "step": 8440 }, { "epoch": 1.56, "learning_rate": 9.820238994273989e-06, "loss": 0.428, "step": 8441 }, { "epoch": 1.56, "learning_rate": 9.818241868533843e-06, "loss": 0.4247, "step": 8442 }, { "epoch": 1.56, "learning_rate": 9.816244750045511e-06, "loss": 0.4419, "step": 8443 }, { "epoch": 1.56, "learning_rate": 9.814247638888672e-06, "loss": 0.4477, "step": 8444 }, { "epoch": 1.56, "learning_rate": 9.812250535143011e-06, "loss": 0.4305, "step": 8445 }, { "epoch": 1.56, "learning_rate": 9.810253438888204e-06, "loss": 0.4212, "step": 8446 }, { "epoch": 1.56, "learning_rate": 9.808256350203934e-06, "loss": 0.4481, "step": 8447 }, { "epoch": 1.56, "learning_rate": 9.806259269169878e-06, "loss": 0.4436, "step": 8448 }, { "epoch": 1.56, "learning_rate": 9.804262195865723e-06, "loss": 0.4211, "step": 8449 }, { "epoch": 1.56, "learning_rate": 9.802265130371144e-06, "loss": 0.4289, "step": 8450 }, { "epoch": 1.56, "learning_rate": 9.800268072765816e-06, "loss": 0.4326, "step": 8451 }, { "epoch": 1.56, "learning_rate": 9.798271023129427e-06, "loss": 0.4447, "step": 8452 }, { "epoch": 1.56, "learning_rate": 9.796273981541645e-06, "loss": 0.4293, "step": 8453 }, { "epoch": 1.56, "learning_rate": 9.794276948082158e-06, "loss": 0.4279, "step": 8454 }, { "epoch": 1.56, "learning_rate": 9.792279922830638e-06, "loss": 0.4284, "step": 8455 }, { "epoch": 1.56, "learning_rate": 9.790282905866767e-06, "loss": 0.4315, "step": 8456 }, { "epoch": 1.56, "learning_rate": 9.78828589727022e-06, "loss": 0.464, "step": 8457 }, { "epoch": 1.56, "learning_rate": 9.786288897120669e-06, "loss": 0.4237, "step": 8458 }, { "epoch": 1.57, "learning_rate": 9.7842919054978e-06, "loss": 0.4248, "step": 8459 }, { "epoch": 1.57, "learning_rate": 9.78229492248128e-06, "loss": 0.4205, "step": 8460 }, { "epoch": 1.57, "learning_rate": 9.780297948150794e-06, "loss": 0.4249, "step": 8461 }, { "epoch": 1.57, "learning_rate": 9.778300982586013e-06, "loss": 0.4149, "step": 8462 }, { "epoch": 1.57, "learning_rate": 9.77630402586661e-06, "loss": 0.4294, "step": 8463 }, { "epoch": 1.57, "learning_rate": 9.774307078072261e-06, "loss": 0.4354, "step": 8464 }, { "epoch": 1.57, "learning_rate": 9.772310139282644e-06, "loss": 0.4487, "step": 8465 }, { "epoch": 1.57, "learning_rate": 9.770313209577431e-06, "loss": 0.4379, "step": 8466 }, { "epoch": 1.57, "learning_rate": 9.768316289036296e-06, "loss": 0.4367, "step": 8467 }, { "epoch": 1.57, "learning_rate": 9.76631937773891e-06, "loss": 0.446, "step": 8468 }, { "epoch": 1.57, "learning_rate": 9.764322475764951e-06, "loss": 0.4431, "step": 8469 }, { "epoch": 1.57, "learning_rate": 9.762325583194085e-06, "loss": 0.4396, "step": 8470 }, { "epoch": 1.57, "learning_rate": 9.760328700105993e-06, "loss": 0.432, "step": 8471 }, { "epoch": 1.57, "learning_rate": 9.75833182658034e-06, "loss": 0.4245, "step": 8472 }, { "epoch": 1.57, "learning_rate": 9.756334962696799e-06, "loss": 0.4776, "step": 8473 }, { "epoch": 1.57, "learning_rate": 9.754338108535042e-06, "loss": 0.4087, "step": 8474 }, { "epoch": 1.57, "learning_rate": 9.752341264174738e-06, "loss": 0.4433, "step": 8475 }, { "epoch": 1.57, "learning_rate": 9.750344429695563e-06, "loss": 0.4338, "step": 8476 }, { "epoch": 1.57, "learning_rate": 9.748347605177178e-06, "loss": 0.4241, "step": 8477 }, { "epoch": 1.57, "learning_rate": 9.746350790699265e-06, "loss": 0.4324, "step": 8478 }, { "epoch": 1.57, "learning_rate": 9.744353986341482e-06, "loss": 0.4327, "step": 8479 }, { "epoch": 1.57, "learning_rate": 9.742357192183498e-06, "loss": 0.4302, "step": 8480 }, { "epoch": 1.57, "learning_rate": 9.740360408304991e-06, "loss": 0.4425, "step": 8481 }, { "epoch": 1.57, "learning_rate": 9.738363634785617e-06, "loss": 0.4331, "step": 8482 }, { "epoch": 1.57, "learning_rate": 9.736366871705054e-06, "loss": 0.4546, "step": 8483 }, { "epoch": 1.57, "learning_rate": 9.734370119142966e-06, "loss": 0.4372, "step": 8484 }, { "epoch": 1.57, "learning_rate": 9.732373377179012e-06, "loss": 0.4119, "step": 8485 }, { "epoch": 1.57, "learning_rate": 9.730376645892872e-06, "loss": 0.4355, "step": 8486 }, { "epoch": 1.57, "learning_rate": 9.728379925364199e-06, "loss": 0.4373, "step": 8487 }, { "epoch": 1.57, "learning_rate": 9.726383215672668e-06, "loss": 0.4452, "step": 8488 }, { "epoch": 1.57, "learning_rate": 9.724386516897937e-06, "loss": 0.43, "step": 8489 }, { "epoch": 1.57, "learning_rate": 9.722389829119674e-06, "loss": 0.436, "step": 8490 }, { "epoch": 1.57, "learning_rate": 9.720393152417545e-06, "loss": 0.4173, "step": 8491 }, { "epoch": 1.57, "learning_rate": 9.71839648687121e-06, "loss": 0.404, "step": 8492 }, { "epoch": 1.57, "learning_rate": 9.716399832560334e-06, "loss": 0.4286, "step": 8493 }, { "epoch": 1.57, "learning_rate": 9.714403189564582e-06, "loss": 0.4311, "step": 8494 }, { "epoch": 1.57, "learning_rate": 9.71240655796361e-06, "loss": 0.4358, "step": 8495 }, { "epoch": 1.57, "learning_rate": 9.710409937837086e-06, "loss": 0.4252, "step": 8496 }, { "epoch": 1.57, "learning_rate": 9.708413329264667e-06, "loss": 0.4198, "step": 8497 }, { "epoch": 1.57, "learning_rate": 9.70641673232602e-06, "loss": 0.4471, "step": 8498 }, { "epoch": 1.57, "learning_rate": 9.704420147100798e-06, "loss": 0.442, "step": 8499 }, { "epoch": 1.57, "learning_rate": 9.70242357366867e-06, "loss": 0.4173, "step": 8500 }, { "epoch": 1.57, "learning_rate": 9.700427012109288e-06, "loss": 0.4392, "step": 8501 }, { "epoch": 1.57, "learning_rate": 9.69843046250231e-06, "loss": 0.4544, "step": 8502 }, { "epoch": 1.57, "learning_rate": 9.696433924927404e-06, "loss": 0.4412, "step": 8503 }, { "epoch": 1.57, "learning_rate": 9.694437399464217e-06, "loss": 0.4304, "step": 8504 }, { "epoch": 1.57, "learning_rate": 9.692440886192417e-06, "loss": 0.4501, "step": 8505 }, { "epoch": 1.57, "learning_rate": 9.690444385191655e-06, "loss": 0.4386, "step": 8506 }, { "epoch": 1.57, "learning_rate": 9.688447896541586e-06, "loss": 0.4513, "step": 8507 }, { "epoch": 1.57, "learning_rate": 9.686451420321872e-06, "loss": 0.439, "step": 8508 }, { "epoch": 1.57, "learning_rate": 9.684454956612162e-06, "loss": 0.4324, "step": 8509 }, { "epoch": 1.57, "learning_rate": 9.68245850549212e-06, "loss": 0.4345, "step": 8510 }, { "epoch": 1.57, "learning_rate": 9.680462067041393e-06, "loss": 0.4386, "step": 8511 }, { "epoch": 1.57, "learning_rate": 9.678465641339639e-06, "loss": 0.4301, "step": 8512 }, { "epoch": 1.58, "learning_rate": 9.67646922846651e-06, "loss": 0.4313, "step": 8513 }, { "epoch": 1.58, "learning_rate": 9.674472828501659e-06, "loss": 0.4458, "step": 8514 }, { "epoch": 1.58, "learning_rate": 9.67247644152474e-06, "loss": 0.4223, "step": 8515 }, { "epoch": 1.58, "learning_rate": 9.670480067615406e-06, "loss": 0.4285, "step": 8516 }, { "epoch": 1.58, "learning_rate": 9.668483706853303e-06, "loss": 0.4156, "step": 8517 }, { "epoch": 1.58, "learning_rate": 9.666487359318092e-06, "loss": 0.4369, "step": 8518 }, { "epoch": 1.58, "learning_rate": 9.664491025089411e-06, "loss": 0.434, "step": 8519 }, { "epoch": 1.58, "learning_rate": 9.662494704246924e-06, "loss": 0.428, "step": 8520 }, { "epoch": 1.58, "learning_rate": 9.660498396870269e-06, "loss": 0.442, "step": 8521 }, { "epoch": 1.58, "learning_rate": 9.658502103039103e-06, "loss": 0.442, "step": 8522 }, { "epoch": 1.58, "learning_rate": 9.65650582283307e-06, "loss": 0.4415, "step": 8523 }, { "epoch": 1.58, "learning_rate": 9.654509556331814e-06, "loss": 0.4203, "step": 8524 }, { "epoch": 1.58, "learning_rate": 9.652513303614992e-06, "loss": 0.4294, "step": 8525 }, { "epoch": 1.58, "learning_rate": 9.650517064762242e-06, "loss": 0.4153, "step": 8526 }, { "epoch": 1.58, "learning_rate": 9.648520839853219e-06, "loss": 0.4415, "step": 8527 }, { "epoch": 1.58, "learning_rate": 9.646524628967563e-06, "loss": 0.4437, "step": 8528 }, { "epoch": 1.58, "learning_rate": 9.644528432184916e-06, "loss": 0.4175, "step": 8529 }, { "epoch": 1.58, "learning_rate": 9.642532249584931e-06, "loss": 0.4267, "step": 8530 }, { "epoch": 1.58, "learning_rate": 9.640536081247241e-06, "loss": 0.4364, "step": 8531 }, { "epoch": 1.58, "learning_rate": 9.638539927251502e-06, "loss": 0.4354, "step": 8532 }, { "epoch": 1.58, "learning_rate": 9.63654378767735e-06, "loss": 0.4426, "step": 8533 }, { "epoch": 1.58, "learning_rate": 9.634547662604423e-06, "loss": 0.4406, "step": 8534 }, { "epoch": 1.58, "learning_rate": 9.632551552112373e-06, "loss": 0.4294, "step": 8535 }, { "epoch": 1.58, "learning_rate": 9.630555456280832e-06, "loss": 0.4375, "step": 8536 }, { "epoch": 1.58, "learning_rate": 9.628559375189448e-06, "loss": 0.4318, "step": 8537 }, { "epoch": 1.58, "learning_rate": 9.626563308917855e-06, "loss": 0.436, "step": 8538 }, { "epoch": 1.58, "learning_rate": 9.624567257545694e-06, "loss": 0.4409, "step": 8539 }, { "epoch": 1.58, "learning_rate": 9.622571221152605e-06, "loss": 0.425, "step": 8540 }, { "epoch": 1.58, "learning_rate": 9.620575199818226e-06, "loss": 0.4139, "step": 8541 }, { "epoch": 1.58, "learning_rate": 9.618579193622191e-06, "loss": 0.4619, "step": 8542 }, { "epoch": 1.58, "learning_rate": 9.616583202644143e-06, "loss": 0.4463, "step": 8543 }, { "epoch": 1.58, "learning_rate": 9.614587226963715e-06, "loss": 0.447, "step": 8544 }, { "epoch": 1.58, "learning_rate": 9.612591266660545e-06, "loss": 0.4515, "step": 8545 }, { "epoch": 1.58, "learning_rate": 9.610595321814261e-06, "loss": 0.4486, "step": 8546 }, { "epoch": 1.58, "learning_rate": 9.608599392504509e-06, "loss": 0.446, "step": 8547 }, { "epoch": 1.58, "learning_rate": 9.60660347881091e-06, "loss": 0.4266, "step": 8548 }, { "epoch": 1.58, "learning_rate": 9.60460758081311e-06, "loss": 0.424, "step": 8549 }, { "epoch": 1.58, "learning_rate": 9.602611698590735e-06, "loss": 0.4098, "step": 8550 }, { "epoch": 1.58, "learning_rate": 9.600615832223412e-06, "loss": 0.423, "step": 8551 }, { "epoch": 1.58, "learning_rate": 9.598619981790783e-06, "loss": 0.443, "step": 8552 }, { "epoch": 1.58, "learning_rate": 9.59662414737247e-06, "loss": 0.4364, "step": 8553 }, { "epoch": 1.58, "learning_rate": 9.59462832904811e-06, "loss": 0.403, "step": 8554 }, { "epoch": 1.58, "learning_rate": 9.59263252689733e-06, "loss": 0.4656, "step": 8555 }, { "epoch": 1.58, "learning_rate": 9.590636740999753e-06, "loss": 0.4342, "step": 8556 }, { "epoch": 1.58, "learning_rate": 9.588640971435015e-06, "loss": 0.4265, "step": 8557 }, { "epoch": 1.58, "learning_rate": 9.586645218282739e-06, "loss": 0.4418, "step": 8558 }, { "epoch": 1.58, "learning_rate": 9.584649481622556e-06, "loss": 0.4252, "step": 8559 }, { "epoch": 1.58, "learning_rate": 9.58265376153409e-06, "loss": 0.4107, "step": 8560 }, { "epoch": 1.58, "learning_rate": 9.580658058096963e-06, "loss": 0.43, "step": 8561 }, { "epoch": 1.58, "learning_rate": 9.578662371390806e-06, "loss": 0.4189, "step": 8562 }, { "epoch": 1.58, "learning_rate": 9.576666701495236e-06, "loss": 0.4431, "step": 8563 }, { "epoch": 1.58, "learning_rate": 9.574671048489886e-06, "loss": 0.4265, "step": 8564 }, { "epoch": 1.58, "learning_rate": 9.57267541245437e-06, "loss": 0.4619, "step": 8565 }, { "epoch": 1.58, "learning_rate": 9.570679793468317e-06, "loss": 0.4204, "step": 8566 }, { "epoch": 1.59, "learning_rate": 9.568684191611343e-06, "loss": 0.4694, "step": 8567 }, { "epoch": 1.59, "learning_rate": 9.566688606963071e-06, "loss": 0.4267, "step": 8568 }, { "epoch": 1.59, "learning_rate": 9.564693039603123e-06, "loss": 0.4345, "step": 8569 }, { "epoch": 1.59, "learning_rate": 9.562697489611113e-06, "loss": 0.4416, "step": 8570 }, { "epoch": 1.59, "learning_rate": 9.56070195706667e-06, "loss": 0.4338, "step": 8571 }, { "epoch": 1.59, "learning_rate": 9.558706442049404e-06, "loss": 0.4298, "step": 8572 }, { "epoch": 1.59, "learning_rate": 9.556710944638929e-06, "loss": 0.4296, "step": 8573 }, { "epoch": 1.59, "learning_rate": 9.554715464914871e-06, "loss": 0.4417, "step": 8574 }, { "epoch": 1.59, "learning_rate": 9.552720002956838e-06, "loss": 0.4134, "step": 8575 }, { "epoch": 1.59, "learning_rate": 9.550724558844453e-06, "loss": 0.4392, "step": 8576 }, { "epoch": 1.59, "learning_rate": 9.548729132657326e-06, "loss": 0.43, "step": 8577 }, { "epoch": 1.59, "learning_rate": 9.546733724475067e-06, "loss": 0.4305, "step": 8578 }, { "epoch": 1.59, "learning_rate": 9.544738334377297e-06, "loss": 0.4463, "step": 8579 }, { "epoch": 1.59, "learning_rate": 9.542742962443622e-06, "loss": 0.4202, "step": 8580 }, { "epoch": 1.59, "learning_rate": 9.540747608753658e-06, "loss": 0.4492, "step": 8581 }, { "epoch": 1.59, "learning_rate": 9.538752273387015e-06, "loss": 0.4465, "step": 8582 }, { "epoch": 1.59, "learning_rate": 9.536756956423298e-06, "loss": 0.4438, "step": 8583 }, { "epoch": 1.59, "learning_rate": 9.534761657942126e-06, "loss": 0.4407, "step": 8584 }, { "epoch": 1.59, "learning_rate": 9.532766378023098e-06, "loss": 0.4288, "step": 8585 }, { "epoch": 1.59, "learning_rate": 9.53077111674583e-06, "loss": 0.443, "step": 8586 }, { "epoch": 1.59, "learning_rate": 9.528775874189922e-06, "loss": 0.4453, "step": 8587 }, { "epoch": 1.59, "learning_rate": 9.526780650434988e-06, "loss": 0.4224, "step": 8588 }, { "epoch": 1.59, "learning_rate": 9.524785445560628e-06, "loss": 0.4367, "step": 8589 }, { "epoch": 1.59, "learning_rate": 9.52279025964645e-06, "loss": 0.4296, "step": 8590 }, { "epoch": 1.59, "learning_rate": 9.520795092772054e-06, "loss": 0.4508, "step": 8591 }, { "epoch": 1.59, "learning_rate": 9.51879994501705e-06, "loss": 0.4254, "step": 8592 }, { "epoch": 1.59, "learning_rate": 9.516804816461036e-06, "loss": 0.4279, "step": 8593 }, { "epoch": 1.59, "learning_rate": 9.514809707183617e-06, "loss": 0.4267, "step": 8594 }, { "epoch": 1.59, "learning_rate": 9.512814617264388e-06, "loss": 0.445, "step": 8595 }, { "epoch": 1.59, "learning_rate": 9.510819546782958e-06, "loss": 0.443, "step": 8596 }, { "epoch": 1.59, "learning_rate": 9.508824495818918e-06, "loss": 0.4337, "step": 8597 }, { "epoch": 1.59, "learning_rate": 9.506829464451876e-06, "loss": 0.4263, "step": 8598 }, { "epoch": 1.59, "learning_rate": 9.504834452761425e-06, "loss": 0.451, "step": 8599 }, { "epoch": 1.59, "learning_rate": 9.502839460827158e-06, "loss": 0.4478, "step": 8600 }, { "epoch": 1.59, "learning_rate": 9.500844488728682e-06, "loss": 0.4122, "step": 8601 }, { "epoch": 1.59, "learning_rate": 9.498849536545582e-06, "loss": 0.4253, "step": 8602 }, { "epoch": 1.59, "learning_rate": 9.49685460435746e-06, "loss": 0.4396, "step": 8603 }, { "epoch": 1.59, "learning_rate": 9.49485969224391e-06, "loss": 0.4246, "step": 8604 }, { "epoch": 1.59, "learning_rate": 9.492864800284516e-06, "loss": 0.4398, "step": 8605 }, { "epoch": 1.59, "learning_rate": 9.490869928558885e-06, "loss": 0.4125, "step": 8606 }, { "epoch": 1.59, "learning_rate": 9.488875077146595e-06, "loss": 0.4311, "step": 8607 }, { "epoch": 1.59, "learning_rate": 9.486880246127248e-06, "loss": 0.4328, "step": 8608 }, { "epoch": 1.59, "learning_rate": 9.484885435580424e-06, "loss": 0.4326, "step": 8609 }, { "epoch": 1.59, "learning_rate": 9.482890645585723e-06, "loss": 0.4359, "step": 8610 }, { "epoch": 1.59, "learning_rate": 9.480895876222728e-06, "loss": 0.4359, "step": 8611 }, { "epoch": 1.59, "learning_rate": 9.47890112757102e-06, "loss": 0.4298, "step": 8612 }, { "epoch": 1.59, "learning_rate": 9.476906399710198e-06, "loss": 0.4072, "step": 8613 }, { "epoch": 1.59, "learning_rate": 9.474911692719838e-06, "loss": 0.4323, "step": 8614 }, { "epoch": 1.59, "learning_rate": 9.472917006679534e-06, "loss": 0.4238, "step": 8615 }, { "epoch": 1.59, "learning_rate": 9.470922341668862e-06, "loss": 0.4349, "step": 8616 }, { "epoch": 1.59, "learning_rate": 9.468927697767411e-06, "loss": 0.4179, "step": 8617 }, { "epoch": 1.59, "learning_rate": 9.466933075054759e-06, "loss": 0.4313, "step": 8618 }, { "epoch": 1.59, "learning_rate": 9.464938473610492e-06, "loss": 0.4354, "step": 8619 }, { "epoch": 1.59, "learning_rate": 9.46294389351419e-06, "loss": 0.4225, "step": 8620 }, { "epoch": 1.6, "learning_rate": 9.460949334845433e-06, "loss": 0.4156, "step": 8621 }, { "epoch": 1.6, "learning_rate": 9.458954797683796e-06, "loss": 0.4377, "step": 8622 }, { "epoch": 1.6, "learning_rate": 9.456960282108865e-06, "loss": 0.4095, "step": 8623 }, { "epoch": 1.6, "learning_rate": 9.454965788200208e-06, "loss": 0.4144, "step": 8624 }, { "epoch": 1.6, "learning_rate": 9.452971316037413e-06, "loss": 0.427, "step": 8625 }, { "epoch": 1.6, "learning_rate": 9.450976865700048e-06, "loss": 0.4404, "step": 8626 }, { "epoch": 1.6, "learning_rate": 9.448982437267687e-06, "loss": 0.4213, "step": 8627 }, { "epoch": 1.6, "learning_rate": 9.446988030819909e-06, "loss": 0.4331, "step": 8628 }, { "epoch": 1.6, "learning_rate": 9.444993646436281e-06, "loss": 0.4203, "step": 8629 }, { "epoch": 1.6, "learning_rate": 9.442999284196384e-06, "loss": 0.4381, "step": 8630 }, { "epoch": 1.6, "learning_rate": 9.44100494417978e-06, "loss": 0.4186, "step": 8631 }, { "epoch": 1.6, "learning_rate": 9.439010626466047e-06, "loss": 0.4205, "step": 8632 }, { "epoch": 1.6, "learning_rate": 9.437016331134752e-06, "loss": 0.4019, "step": 8633 }, { "epoch": 1.6, "learning_rate": 9.435022058265459e-06, "loss": 0.4431, "step": 8634 }, { "epoch": 1.6, "learning_rate": 9.433027807937745e-06, "loss": 0.4166, "step": 8635 }, { "epoch": 1.6, "learning_rate": 9.431033580231166e-06, "loss": 0.4246, "step": 8636 }, { "epoch": 1.6, "learning_rate": 9.429039375225298e-06, "loss": 0.4451, "step": 8637 }, { "epoch": 1.6, "learning_rate": 9.4270451929997e-06, "loss": 0.431, "step": 8638 }, { "epoch": 1.6, "learning_rate": 9.425051033633938e-06, "loss": 0.4351, "step": 8639 }, { "epoch": 1.6, "learning_rate": 9.423056897207575e-06, "loss": 0.4315, "step": 8640 }, { "epoch": 1.6, "learning_rate": 9.421062783800174e-06, "loss": 0.4151, "step": 8641 }, { "epoch": 1.6, "learning_rate": 9.419068693491297e-06, "loss": 0.4289, "step": 8642 }, { "epoch": 1.6, "learning_rate": 9.417074626360504e-06, "loss": 0.4197, "step": 8643 }, { "epoch": 1.6, "learning_rate": 9.41508058248735e-06, "loss": 0.4203, "step": 8644 }, { "epoch": 1.6, "learning_rate": 9.413086561951403e-06, "loss": 0.4413, "step": 8645 }, { "epoch": 1.6, "learning_rate": 9.411092564832212e-06, "loss": 0.4179, "step": 8646 }, { "epoch": 1.6, "learning_rate": 9.40909859120934e-06, "loss": 0.4262, "step": 8647 }, { "epoch": 1.6, "learning_rate": 9.407104641162341e-06, "loss": 0.4229, "step": 8648 }, { "epoch": 1.6, "learning_rate": 9.405110714770765e-06, "loss": 0.4628, "step": 8649 }, { "epoch": 1.6, "learning_rate": 9.403116812114173e-06, "loss": 0.4436, "step": 8650 }, { "epoch": 1.6, "learning_rate": 9.401122933272112e-06, "loss": 0.4415, "step": 8651 }, { "epoch": 1.6, "learning_rate": 9.399129078324141e-06, "loss": 0.4403, "step": 8652 }, { "epoch": 1.6, "learning_rate": 9.397135247349803e-06, "loss": 0.4277, "step": 8653 }, { "epoch": 1.6, "learning_rate": 9.395141440428657e-06, "loss": 0.43, "step": 8654 }, { "epoch": 1.6, "learning_rate": 9.393147657640248e-06, "loss": 0.4517, "step": 8655 }, { "epoch": 1.6, "learning_rate": 9.39115389906412e-06, "loss": 0.4441, "step": 8656 }, { "epoch": 1.6, "learning_rate": 9.389160164779827e-06, "loss": 0.4434, "step": 8657 }, { "epoch": 1.6, "learning_rate": 9.387166454866909e-06, "loss": 0.4494, "step": 8658 }, { "epoch": 1.6, "learning_rate": 9.385172769404918e-06, "loss": 0.428, "step": 8659 }, { "epoch": 1.6, "learning_rate": 9.383179108473397e-06, "loss": 0.4265, "step": 8660 }, { "epoch": 1.6, "learning_rate": 9.381185472151882e-06, "loss": 0.4187, "step": 8661 }, { "epoch": 1.6, "learning_rate": 9.379191860519926e-06, "loss": 0.4342, "step": 8662 }, { "epoch": 1.6, "learning_rate": 9.377198273657062e-06, "loss": 0.4117, "step": 8663 }, { "epoch": 1.6, "learning_rate": 9.375204711642836e-06, "loss": 0.4367, "step": 8664 }, { "epoch": 1.6, "learning_rate": 9.373211174556784e-06, "loss": 0.4217, "step": 8665 }, { "epoch": 1.6, "learning_rate": 9.371217662478445e-06, "loss": 0.4163, "step": 8666 }, { "epoch": 1.6, "learning_rate": 9.369224175487358e-06, "loss": 0.4201, "step": 8667 }, { "epoch": 1.6, "learning_rate": 9.367230713663059e-06, "loss": 0.4365, "step": 8668 }, { "epoch": 1.6, "learning_rate": 9.365237277085081e-06, "loss": 0.4519, "step": 8669 }, { "epoch": 1.6, "learning_rate": 9.363243865832963e-06, "loss": 0.4291, "step": 8670 }, { "epoch": 1.6, "learning_rate": 9.361250479986234e-06, "loss": 0.4232, "step": 8671 }, { "epoch": 1.6, "learning_rate": 9.35925711962443e-06, "loss": 0.4354, "step": 8672 }, { "epoch": 1.6, "learning_rate": 9.357263784827078e-06, "loss": 0.4216, "step": 8673 }, { "epoch": 1.6, "learning_rate": 9.355270475673713e-06, "loss": 0.4523, "step": 8674 }, { "epoch": 1.6, "learning_rate": 9.353277192243861e-06, "loss": 0.4378, "step": 8675 }, { "epoch": 1.61, "learning_rate": 9.351283934617053e-06, "loss": 0.4345, "step": 8676 }, { "epoch": 1.61, "learning_rate": 9.349290702872818e-06, "loss": 0.4056, "step": 8677 }, { "epoch": 1.61, "learning_rate": 9.347297497090673e-06, "loss": 0.421, "step": 8678 }, { "epoch": 1.61, "learning_rate": 9.345304317350153e-06, "loss": 0.4284, "step": 8679 }, { "epoch": 1.61, "learning_rate": 9.343311163730777e-06, "loss": 0.4348, "step": 8680 }, { "epoch": 1.61, "learning_rate": 9.341318036312071e-06, "loss": 0.4567, "step": 8681 }, { "epoch": 1.61, "learning_rate": 9.339324935173557e-06, "loss": 0.4373, "step": 8682 }, { "epoch": 1.61, "learning_rate": 9.337331860394752e-06, "loss": 0.4375, "step": 8683 }, { "epoch": 1.61, "learning_rate": 9.335338812055182e-06, "loss": 0.4336, "step": 8684 }, { "epoch": 1.61, "learning_rate": 9.333345790234357e-06, "loss": 0.4125, "step": 8685 }, { "epoch": 1.61, "learning_rate": 9.331352795011806e-06, "loss": 0.4337, "step": 8686 }, { "epoch": 1.61, "learning_rate": 9.32935982646704e-06, "loss": 0.4139, "step": 8687 }, { "epoch": 1.61, "learning_rate": 9.327366884679574e-06, "loss": 0.4215, "step": 8688 }, { "epoch": 1.61, "learning_rate": 9.325373969728924e-06, "loss": 0.4273, "step": 8689 }, { "epoch": 1.61, "learning_rate": 9.323381081694604e-06, "loss": 0.4187, "step": 8690 }, { "epoch": 1.61, "learning_rate": 9.321388220656126e-06, "loss": 0.4056, "step": 8691 }, { "epoch": 1.61, "learning_rate": 9.319395386693003e-06, "loss": 0.4396, "step": 8692 }, { "epoch": 1.61, "learning_rate": 9.31740257988474e-06, "loss": 0.4507, "step": 8693 }, { "epoch": 1.61, "learning_rate": 9.315409800310856e-06, "loss": 0.4455, "step": 8694 }, { "epoch": 1.61, "learning_rate": 9.313417048050847e-06, "loss": 0.4532, "step": 8695 }, { "epoch": 1.61, "learning_rate": 9.311424323184231e-06, "loss": 0.4269, "step": 8696 }, { "epoch": 1.61, "learning_rate": 9.30943162579051e-06, "loss": 0.43, "step": 8697 }, { "epoch": 1.61, "learning_rate": 9.307438955949186e-06, "loss": 0.4417, "step": 8698 }, { "epoch": 1.61, "learning_rate": 9.305446313739767e-06, "loss": 0.4056, "step": 8699 }, { "epoch": 1.61, "learning_rate": 9.303453699241752e-06, "loss": 0.4286, "step": 8700 }, { "epoch": 1.61, "learning_rate": 9.301461112534648e-06, "loss": 0.4361, "step": 8701 }, { "epoch": 1.61, "learning_rate": 9.299468553697949e-06, "loss": 0.4536, "step": 8702 }, { "epoch": 1.61, "learning_rate": 9.297476022811161e-06, "loss": 0.435, "step": 8703 }, { "epoch": 1.61, "learning_rate": 9.29548351995378e-06, "loss": 0.4362, "step": 8704 }, { "epoch": 1.61, "learning_rate": 9.293491045205297e-06, "loss": 0.4264, "step": 8705 }, { "epoch": 1.61, "learning_rate": 9.291498598645218e-06, "loss": 0.4318, "step": 8706 }, { "epoch": 1.61, "learning_rate": 9.289506180353028e-06, "loss": 0.4324, "step": 8707 }, { "epoch": 1.61, "learning_rate": 9.287513790408232e-06, "loss": 0.445, "step": 8708 }, { "epoch": 1.61, "learning_rate": 9.285521428890313e-06, "loss": 0.4202, "step": 8709 }, { "epoch": 1.61, "learning_rate": 9.283529095878766e-06, "loss": 0.4191, "step": 8710 }, { "epoch": 1.61, "learning_rate": 9.281536791453084e-06, "loss": 0.441, "step": 8711 }, { "epoch": 1.61, "learning_rate": 9.27954451569275e-06, "loss": 0.4525, "step": 8712 }, { "epoch": 1.61, "learning_rate": 9.27755226867726e-06, "loss": 0.4322, "step": 8713 }, { "epoch": 1.61, "learning_rate": 9.275560050486095e-06, "loss": 0.4369, "step": 8714 }, { "epoch": 1.61, "learning_rate": 9.273567861198742e-06, "loss": 0.4311, "step": 8715 }, { "epoch": 1.61, "learning_rate": 9.271575700894686e-06, "loss": 0.4051, "step": 8716 }, { "epoch": 1.61, "learning_rate": 9.269583569653412e-06, "loss": 0.4246, "step": 8717 }, { "epoch": 1.61, "learning_rate": 9.2675914675544e-06, "loss": 0.4346, "step": 8718 }, { "epoch": 1.61, "learning_rate": 9.265599394677137e-06, "loss": 0.4489, "step": 8719 }, { "epoch": 1.61, "learning_rate": 9.263607351101092e-06, "loss": 0.4283, "step": 8720 }, { "epoch": 1.61, "learning_rate": 9.261615336905756e-06, "loss": 0.4408, "step": 8721 }, { "epoch": 1.61, "learning_rate": 9.259623352170595e-06, "loss": 0.4233, "step": 8722 }, { "epoch": 1.61, "learning_rate": 9.257631396975097e-06, "loss": 0.4267, "step": 8723 }, { "epoch": 1.61, "learning_rate": 9.255639471398728e-06, "loss": 0.4503, "step": 8724 }, { "epoch": 1.61, "learning_rate": 9.25364757552097e-06, "loss": 0.454, "step": 8725 }, { "epoch": 1.61, "learning_rate": 9.251655709421291e-06, "loss": 0.4353, "step": 8726 }, { "epoch": 1.61, "learning_rate": 9.24966387317916e-06, "loss": 0.4459, "step": 8727 }, { "epoch": 1.61, "learning_rate": 9.247672066874056e-06, "loss": 0.4103, "step": 8728 }, { "epoch": 1.61, "learning_rate": 9.245680290585438e-06, "loss": 0.4183, "step": 8729 }, { "epoch": 1.62, "learning_rate": 9.243688544392784e-06, "loss": 0.4367, "step": 8730 }, { "epoch": 1.62, "learning_rate": 9.241696828375558e-06, "loss": 0.4205, "step": 8731 }, { "epoch": 1.62, "learning_rate": 9.23970514261322e-06, "loss": 0.4197, "step": 8732 }, { "epoch": 1.62, "learning_rate": 9.237713487185242e-06, "loss": 0.4459, "step": 8733 }, { "epoch": 1.62, "learning_rate": 9.235721862171084e-06, "loss": 0.4243, "step": 8734 }, { "epoch": 1.62, "learning_rate": 9.233730267650209e-06, "loss": 0.4442, "step": 8735 }, { "epoch": 1.62, "learning_rate": 9.23173870370208e-06, "loss": 0.4366, "step": 8736 }, { "epoch": 1.62, "learning_rate": 9.229747170406149e-06, "loss": 0.4259, "step": 8737 }, { "epoch": 1.62, "learning_rate": 9.227755667841884e-06, "loss": 0.4267, "step": 8738 }, { "epoch": 1.62, "learning_rate": 9.225764196088733e-06, "loss": 0.4251, "step": 8739 }, { "epoch": 1.62, "learning_rate": 9.223772755226163e-06, "loss": 0.4476, "step": 8740 }, { "epoch": 1.62, "learning_rate": 9.22178134533362e-06, "loss": 0.4244, "step": 8741 }, { "epoch": 1.62, "learning_rate": 9.21978996649056e-06, "loss": 0.4381, "step": 8742 }, { "epoch": 1.62, "learning_rate": 9.217798618776438e-06, "loss": 0.4272, "step": 8743 }, { "epoch": 1.62, "learning_rate": 9.2158073022707e-06, "loss": 0.4175, "step": 8744 }, { "epoch": 1.62, "learning_rate": 9.213816017052801e-06, "loss": 0.43, "step": 8745 }, { "epoch": 1.62, "learning_rate": 9.211824763202187e-06, "loss": 0.4447, "step": 8746 }, { "epoch": 1.62, "learning_rate": 9.209833540798305e-06, "loss": 0.4375, "step": 8747 }, { "epoch": 1.62, "learning_rate": 9.207842349920603e-06, "loss": 0.4563, "step": 8748 }, { "epoch": 1.62, "learning_rate": 9.205851190648523e-06, "loss": 0.4203, "step": 8749 }, { "epoch": 1.62, "learning_rate": 9.203860063061512e-06, "loss": 0.4286, "step": 8750 }, { "epoch": 1.62, "learning_rate": 9.201868967239008e-06, "loss": 0.4477, "step": 8751 }, { "epoch": 1.62, "learning_rate": 9.199877903260458e-06, "loss": 0.4429, "step": 8752 }, { "epoch": 1.62, "learning_rate": 9.197886871205298e-06, "loss": 0.4271, "step": 8753 }, { "epoch": 1.62, "learning_rate": 9.195895871152962e-06, "loss": 0.4424, "step": 8754 }, { "epoch": 1.62, "learning_rate": 9.193904903182898e-06, "loss": 0.4466, "step": 8755 }, { "epoch": 1.62, "learning_rate": 9.19191396737453e-06, "loss": 0.4528, "step": 8756 }, { "epoch": 1.62, "learning_rate": 9.189923063807303e-06, "loss": 0.4343, "step": 8757 }, { "epoch": 1.62, "learning_rate": 9.187932192560646e-06, "loss": 0.447, "step": 8758 }, { "epoch": 1.62, "learning_rate": 9.185941353713988e-06, "loss": 0.4344, "step": 8759 }, { "epoch": 1.62, "learning_rate": 9.183950547346767e-06, "loss": 0.4281, "step": 8760 }, { "epoch": 1.62, "learning_rate": 9.181959773538401e-06, "loss": 0.4313, "step": 8761 }, { "epoch": 1.62, "learning_rate": 9.179969032368333e-06, "loss": 0.4491, "step": 8762 }, { "epoch": 1.62, "learning_rate": 9.17797832391598e-06, "loss": 0.4154, "step": 8763 }, { "epoch": 1.62, "learning_rate": 9.175987648260768e-06, "loss": 0.4397, "step": 8764 }, { "epoch": 1.62, "learning_rate": 9.173997005482123e-06, "loss": 0.4293, "step": 8765 }, { "epoch": 1.62, "learning_rate": 9.17200639565947e-06, "loss": 0.4121, "step": 8766 }, { "epoch": 1.62, "learning_rate": 9.170015818872229e-06, "loss": 0.4111, "step": 8767 }, { "epoch": 1.62, "learning_rate": 9.168025275199818e-06, "loss": 0.438, "step": 8768 }, { "epoch": 1.62, "learning_rate": 9.166034764721661e-06, "loss": 0.4349, "step": 8769 }, { "epoch": 1.62, "learning_rate": 9.164044287517173e-06, "loss": 0.4291, "step": 8770 }, { "epoch": 1.62, "learning_rate": 9.162053843665767e-06, "loss": 0.4424, "step": 8771 }, { "epoch": 1.62, "learning_rate": 9.160063433246866e-06, "loss": 0.4458, "step": 8772 }, { "epoch": 1.62, "learning_rate": 9.158073056339872e-06, "loss": 0.4196, "step": 8773 }, { "epoch": 1.62, "learning_rate": 9.15608271302421e-06, "loss": 0.4291, "step": 8774 }, { "epoch": 1.62, "learning_rate": 9.154092403379286e-06, "loss": 0.423, "step": 8775 }, { "epoch": 1.62, "learning_rate": 9.152102127484503e-06, "loss": 0.4182, "step": 8776 }, { "epoch": 1.62, "learning_rate": 9.150111885419282e-06, "loss": 0.4209, "step": 8777 }, { "epoch": 1.62, "learning_rate": 9.148121677263018e-06, "loss": 0.4421, "step": 8778 }, { "epoch": 1.62, "learning_rate": 9.146131503095124e-06, "loss": 0.4349, "step": 8779 }, { "epoch": 1.62, "learning_rate": 9.144141362995006e-06, "loss": 0.4344, "step": 8780 }, { "epoch": 1.62, "learning_rate": 9.142151257042056e-06, "loss": 0.431, "step": 8781 }, { "epoch": 1.62, "learning_rate": 9.140161185315687e-06, "loss": 0.4385, "step": 8782 }, { "epoch": 1.62, "learning_rate": 9.138171147895292e-06, "loss": 0.463, "step": 8783 }, { "epoch": 1.63, "learning_rate": 9.136181144860275e-06, "loss": 0.4686, "step": 8784 }, { "epoch": 1.63, "learning_rate": 9.134191176290033e-06, "loss": 0.4205, "step": 8785 }, { "epoch": 1.63, "learning_rate": 9.132201242263954e-06, "loss": 0.4317, "step": 8786 }, { "epoch": 1.63, "learning_rate": 9.130211342861444e-06, "loss": 0.4297, "step": 8787 }, { "epoch": 1.63, "learning_rate": 9.128221478161885e-06, "loss": 0.4492, "step": 8788 }, { "epoch": 1.63, "learning_rate": 9.126231648244681e-06, "loss": 0.4303, "step": 8789 }, { "epoch": 1.63, "learning_rate": 9.124241853189212e-06, "loss": 0.4289, "step": 8790 }, { "epoch": 1.63, "learning_rate": 9.122252093074877e-06, "loss": 0.4378, "step": 8791 }, { "epoch": 1.63, "learning_rate": 9.120262367981054e-06, "loss": 0.442, "step": 8792 }, { "epoch": 1.63, "learning_rate": 9.118272677987135e-06, "loss": 0.4345, "step": 8793 }, { "epoch": 1.63, "learning_rate": 9.116283023172504e-06, "loss": 0.4222, "step": 8794 }, { "epoch": 1.63, "learning_rate": 9.114293403616543e-06, "loss": 0.4092, "step": 8795 }, { "epoch": 1.63, "learning_rate": 9.112303819398635e-06, "loss": 0.4223, "step": 8796 }, { "epoch": 1.63, "learning_rate": 9.110314270598165e-06, "loss": 0.4192, "step": 8797 }, { "epoch": 1.63, "learning_rate": 9.108324757294504e-06, "loss": 0.4219, "step": 8798 }, { "epoch": 1.63, "learning_rate": 9.106335279567038e-06, "loss": 0.4623, "step": 8799 }, { "epoch": 1.63, "learning_rate": 9.104345837495134e-06, "loss": 0.4284, "step": 8800 }, { "epoch": 1.63, "learning_rate": 9.102356431158179e-06, "loss": 0.4272, "step": 8801 }, { "epoch": 1.63, "learning_rate": 9.10036706063554e-06, "loss": 0.4215, "step": 8802 }, { "epoch": 1.63, "learning_rate": 9.098377726006586e-06, "loss": 0.4276, "step": 8803 }, { "epoch": 1.63, "learning_rate": 9.096388427350694e-06, "loss": 0.4326, "step": 8804 }, { "epoch": 1.63, "learning_rate": 9.094399164747228e-06, "loss": 0.4238, "step": 8805 }, { "epoch": 1.63, "learning_rate": 9.092409938275562e-06, "loss": 0.4383, "step": 8806 }, { "epoch": 1.63, "learning_rate": 9.09042074801506e-06, "loss": 0.4499, "step": 8807 }, { "epoch": 1.63, "learning_rate": 9.088431594045083e-06, "loss": 0.4304, "step": 8808 }, { "epoch": 1.63, "learning_rate": 9.086442476445e-06, "loss": 0.4216, "step": 8809 }, { "epoch": 1.63, "learning_rate": 9.084453395294167e-06, "loss": 0.4429, "step": 8810 }, { "epoch": 1.63, "learning_rate": 9.082464350671952e-06, "loss": 0.4373, "step": 8811 }, { "epoch": 1.63, "learning_rate": 9.080475342657706e-06, "loss": 0.4424, "step": 8812 }, { "epoch": 1.63, "learning_rate": 9.078486371330797e-06, "loss": 0.4282, "step": 8813 }, { "epoch": 1.63, "learning_rate": 9.076497436770573e-06, "loss": 0.4368, "step": 8814 }, { "epoch": 1.63, "learning_rate": 9.074508539056392e-06, "loss": 0.4356, "step": 8815 }, { "epoch": 1.63, "learning_rate": 9.072519678267606e-06, "loss": 0.4371, "step": 8816 }, { "epoch": 1.63, "learning_rate": 9.070530854483569e-06, "loss": 0.4164, "step": 8817 }, { "epoch": 1.63, "learning_rate": 9.068542067783628e-06, "loss": 0.4183, "step": 8818 }, { "epoch": 1.63, "learning_rate": 9.066553318247136e-06, "loss": 0.4141, "step": 8819 }, { "epoch": 1.63, "learning_rate": 9.064564605953436e-06, "loss": 0.4285, "step": 8820 }, { "epoch": 1.63, "learning_rate": 9.06257593098188e-06, "loss": 0.4162, "step": 8821 }, { "epoch": 1.63, "learning_rate": 9.060587293411805e-06, "loss": 0.4219, "step": 8822 }, { "epoch": 1.63, "learning_rate": 9.05859869332256e-06, "loss": 0.4334, "step": 8823 }, { "epoch": 1.63, "learning_rate": 9.056610130793486e-06, "loss": 0.4325, "step": 8824 }, { "epoch": 1.63, "learning_rate": 9.054621605903916e-06, "loss": 0.4579, "step": 8825 }, { "epoch": 1.63, "learning_rate": 9.052633118733198e-06, "loss": 0.4157, "step": 8826 }, { "epoch": 1.63, "learning_rate": 9.050644669360661e-06, "loss": 0.4308, "step": 8827 }, { "epoch": 1.63, "learning_rate": 9.048656257865647e-06, "loss": 0.4394, "step": 8828 }, { "epoch": 1.63, "learning_rate": 9.046667884327488e-06, "loss": 0.4302, "step": 8829 }, { "epoch": 1.63, "learning_rate": 9.04467954882551e-06, "loss": 0.4447, "step": 8830 }, { "epoch": 1.63, "learning_rate": 9.042691251439055e-06, "loss": 0.4434, "step": 8831 }, { "epoch": 1.63, "learning_rate": 9.040702992247442e-06, "loss": 0.4203, "step": 8832 }, { "epoch": 1.63, "learning_rate": 9.038714771330006e-06, "loss": 0.4378, "step": 8833 }, { "epoch": 1.63, "learning_rate": 9.03672658876607e-06, "loss": 0.4374, "step": 8834 }, { "epoch": 1.63, "learning_rate": 9.034738444634962e-06, "loss": 0.444, "step": 8835 }, { "epoch": 1.63, "learning_rate": 9.032750339016002e-06, "loss": 0.436, "step": 8836 }, { "epoch": 1.63, "learning_rate": 9.03076227198851e-06, "loss": 0.4325, "step": 8837 }, { "epoch": 1.64, "learning_rate": 9.028774243631813e-06, "loss": 0.4125, "step": 8838 }, { "epoch": 1.64, "learning_rate": 9.02678625402522e-06, "loss": 0.4363, "step": 8839 }, { "epoch": 1.64, "learning_rate": 9.024798303248058e-06, "loss": 0.4304, "step": 8840 }, { "epoch": 1.64, "learning_rate": 9.022810391379637e-06, "loss": 0.4459, "step": 8841 }, { "epoch": 1.64, "learning_rate": 9.02082251849927e-06, "loss": 0.4219, "step": 8842 }, { "epoch": 1.64, "learning_rate": 9.018834684686275e-06, "loss": 0.4507, "step": 8843 }, { "epoch": 1.64, "learning_rate": 9.016846890019958e-06, "loss": 0.4317, "step": 8844 }, { "epoch": 1.64, "learning_rate": 9.01485913457963e-06, "loss": 0.4243, "step": 8845 }, { "epoch": 1.64, "learning_rate": 9.0128714184446e-06, "loss": 0.429, "step": 8846 }, { "epoch": 1.64, "learning_rate": 9.010883741694169e-06, "loss": 0.4154, "step": 8847 }, { "epoch": 1.64, "learning_rate": 9.00889610440765e-06, "loss": 0.4418, "step": 8848 }, { "epoch": 1.64, "learning_rate": 9.006908506664335e-06, "loss": 0.4299, "step": 8849 }, { "epoch": 1.64, "learning_rate": 9.00492094854354e-06, "loss": 0.4235, "step": 8850 }, { "epoch": 1.64, "learning_rate": 9.002933430124554e-06, "loss": 0.4338, "step": 8851 }, { "epoch": 1.64, "learning_rate": 9.000945951486675e-06, "loss": 0.4448, "step": 8852 }, { "epoch": 1.64, "learning_rate": 8.998958512709205e-06, "loss": 0.4397, "step": 8853 }, { "epoch": 1.64, "learning_rate": 8.996971113871436e-06, "loss": 0.4249, "step": 8854 }, { "epoch": 1.64, "learning_rate": 8.994983755052665e-06, "loss": 0.4412, "step": 8855 }, { "epoch": 1.64, "learning_rate": 8.992996436332178e-06, "loss": 0.418, "step": 8856 }, { "epoch": 1.64, "learning_rate": 8.991009157789272e-06, "loss": 0.4158, "step": 8857 }, { "epoch": 1.64, "learning_rate": 8.989021919503234e-06, "loss": 0.4288, "step": 8858 }, { "epoch": 1.64, "learning_rate": 8.987034721553343e-06, "loss": 0.437, "step": 8859 }, { "epoch": 1.64, "learning_rate": 8.985047564018897e-06, "loss": 0.4237, "step": 8860 }, { "epoch": 1.64, "learning_rate": 8.983060446979169e-06, "loss": 0.4572, "step": 8861 }, { "epoch": 1.64, "learning_rate": 8.981073370513452e-06, "loss": 0.4352, "step": 8862 }, { "epoch": 1.64, "learning_rate": 8.979086334701019e-06, "loss": 0.4139, "step": 8863 }, { "epoch": 1.64, "learning_rate": 8.97709933962115e-06, "loss": 0.4351, "step": 8864 }, { "epoch": 1.64, "learning_rate": 8.975112385353124e-06, "loss": 0.4311, "step": 8865 }, { "epoch": 1.64, "learning_rate": 8.973125471976213e-06, "loss": 0.4264, "step": 8866 }, { "epoch": 1.64, "learning_rate": 8.9711385995697e-06, "loss": 0.4063, "step": 8867 }, { "epoch": 1.64, "learning_rate": 8.96915176821285e-06, "loss": 0.4086, "step": 8868 }, { "epoch": 1.64, "learning_rate": 8.967164977984936e-06, "loss": 0.4178, "step": 8869 }, { "epoch": 1.64, "learning_rate": 8.965178228965225e-06, "loss": 0.4254, "step": 8870 }, { "epoch": 1.64, "learning_rate": 8.96319152123299e-06, "loss": 0.4247, "step": 8871 }, { "epoch": 1.64, "learning_rate": 8.961204854867491e-06, "loss": 0.4162, "step": 8872 }, { "epoch": 1.64, "learning_rate": 8.959218229947998e-06, "loss": 0.4315, "step": 8873 }, { "epoch": 1.64, "learning_rate": 8.957231646553765e-06, "loss": 0.437, "step": 8874 }, { "epoch": 1.64, "learning_rate": 8.955245104764066e-06, "loss": 0.4189, "step": 8875 }, { "epoch": 1.64, "learning_rate": 8.953258604658147e-06, "loss": 0.4285, "step": 8876 }, { "epoch": 1.64, "learning_rate": 8.951272146315276e-06, "loss": 0.4226, "step": 8877 }, { "epoch": 1.64, "learning_rate": 8.9492857298147e-06, "loss": 0.4152, "step": 8878 }, { "epoch": 1.64, "learning_rate": 8.947299355235683e-06, "loss": 0.4354, "step": 8879 }, { "epoch": 1.64, "learning_rate": 8.945313022657472e-06, "loss": 0.4288, "step": 8880 }, { "epoch": 1.64, "learning_rate": 8.943326732159314e-06, "loss": 0.4369, "step": 8881 }, { "epoch": 1.64, "learning_rate": 8.941340483820469e-06, "loss": 0.4295, "step": 8882 }, { "epoch": 1.64, "learning_rate": 8.939354277720174e-06, "loss": 0.4467, "step": 8883 }, { "epoch": 1.64, "learning_rate": 8.937368113937682e-06, "loss": 0.4231, "step": 8884 }, { "epoch": 1.64, "learning_rate": 8.935381992552237e-06, "loss": 0.4036, "step": 8885 }, { "epoch": 1.64, "learning_rate": 8.933395913643074e-06, "loss": 0.4225, "step": 8886 }, { "epoch": 1.64, "learning_rate": 8.931409877289444e-06, "loss": 0.4344, "step": 8887 }, { "epoch": 1.64, "learning_rate": 8.929423883570577e-06, "loss": 0.4366, "step": 8888 }, { "epoch": 1.64, "learning_rate": 8.927437932565719e-06, "loss": 0.4151, "step": 8889 }, { "epoch": 1.64, "learning_rate": 8.9254520243541e-06, "loss": 0.4343, "step": 8890 }, { "epoch": 1.64, "learning_rate": 8.923466159014956e-06, "loss": 0.4368, "step": 8891 }, { "epoch": 1.65, "learning_rate": 8.921480336627518e-06, "loss": 0.4308, "step": 8892 }, { "epoch": 1.65, "learning_rate": 8.91949455727102e-06, "loss": 0.4369, "step": 8893 }, { "epoch": 1.65, "learning_rate": 8.917508821024686e-06, "loss": 0.4196, "step": 8894 }, { "epoch": 1.65, "learning_rate": 8.91552312796775e-06, "loss": 0.4185, "step": 8895 }, { "epoch": 1.65, "learning_rate": 8.913537478179426e-06, "loss": 0.446, "step": 8896 }, { "epoch": 1.65, "learning_rate": 8.911551871738952e-06, "loss": 0.4478, "step": 8897 }, { "epoch": 1.65, "learning_rate": 8.90956630872554e-06, "loss": 0.4444, "step": 8898 }, { "epoch": 1.65, "learning_rate": 8.907580789218415e-06, "loss": 0.428, "step": 8899 }, { "epoch": 1.65, "learning_rate": 8.90559531329679e-06, "loss": 0.4353, "step": 8900 }, { "epoch": 1.65, "learning_rate": 8.903609881039892e-06, "loss": 0.4497, "step": 8901 }, { "epoch": 1.65, "learning_rate": 8.901624492526928e-06, "loss": 0.4358, "step": 8902 }, { "epoch": 1.65, "learning_rate": 8.89963914783711e-06, "loss": 0.4306, "step": 8903 }, { "epoch": 1.65, "learning_rate": 8.897653847049657e-06, "loss": 0.4512, "step": 8904 }, { "epoch": 1.65, "learning_rate": 8.895668590243768e-06, "loss": 0.4255, "step": 8905 }, { "epoch": 1.65, "learning_rate": 8.893683377498664e-06, "loss": 0.4573, "step": 8906 }, { "epoch": 1.65, "learning_rate": 8.891698208893545e-06, "loss": 0.4228, "step": 8907 }, { "epoch": 1.65, "learning_rate": 8.889713084507611e-06, "loss": 0.4416, "step": 8908 }, { "epoch": 1.65, "learning_rate": 8.887728004420073e-06, "loss": 0.4206, "step": 8909 }, { "epoch": 1.65, "learning_rate": 8.885742968710125e-06, "loss": 0.4442, "step": 8910 }, { "epoch": 1.65, "learning_rate": 8.883757977456973e-06, "loss": 0.443, "step": 8911 }, { "epoch": 1.65, "learning_rate": 8.881773030739811e-06, "loss": 0.4515, "step": 8912 }, { "epoch": 1.65, "learning_rate": 8.879788128637831e-06, "loss": 0.4218, "step": 8913 }, { "epoch": 1.65, "learning_rate": 8.877803271230234e-06, "loss": 0.4397, "step": 8914 }, { "epoch": 1.65, "learning_rate": 8.875818458596206e-06, "loss": 0.4223, "step": 8915 }, { "epoch": 1.65, "learning_rate": 8.873833690814944e-06, "loss": 0.447, "step": 8916 }, { "epoch": 1.65, "learning_rate": 8.87184896796563e-06, "loss": 0.437, "step": 8917 }, { "epoch": 1.65, "learning_rate": 8.869864290127454e-06, "loss": 0.4291, "step": 8918 }, { "epoch": 1.65, "learning_rate": 8.867879657379598e-06, "loss": 0.4253, "step": 8919 }, { "epoch": 1.65, "learning_rate": 8.865895069801252e-06, "loss": 0.4432, "step": 8920 }, { "epoch": 1.65, "learning_rate": 8.86391052747159e-06, "loss": 0.4253, "step": 8921 }, { "epoch": 1.65, "learning_rate": 8.861926030469795e-06, "loss": 0.4506, "step": 8922 }, { "epoch": 1.65, "learning_rate": 8.859941578875044e-06, "loss": 0.4503, "step": 8923 }, { "epoch": 1.65, "learning_rate": 8.857957172766516e-06, "loss": 0.429, "step": 8924 }, { "epoch": 1.65, "learning_rate": 8.855972812223377e-06, "loss": 0.4196, "step": 8925 }, { "epoch": 1.65, "learning_rate": 8.853988497324811e-06, "loss": 0.4205, "step": 8926 }, { "epoch": 1.65, "learning_rate": 8.852004228149976e-06, "loss": 0.4361, "step": 8927 }, { "epoch": 1.65, "learning_rate": 8.850020004778053e-06, "loss": 0.4343, "step": 8928 }, { "epoch": 1.65, "learning_rate": 8.848035827288202e-06, "loss": 0.4306, "step": 8929 }, { "epoch": 1.65, "learning_rate": 8.846051695759582e-06, "loss": 0.4309, "step": 8930 }, { "epoch": 1.65, "learning_rate": 8.84406761027137e-06, "loss": 0.4269, "step": 8931 }, { "epoch": 1.65, "learning_rate": 8.842083570902715e-06, "loss": 0.4406, "step": 8932 }, { "epoch": 1.65, "learning_rate": 8.840099577732787e-06, "loss": 0.4055, "step": 8933 }, { "epoch": 1.65, "learning_rate": 8.838115630840737e-06, "loss": 0.4229, "step": 8934 }, { "epoch": 1.65, "learning_rate": 8.836131730305718e-06, "loss": 0.4245, "step": 8935 }, { "epoch": 1.65, "learning_rate": 8.834147876206894e-06, "loss": 0.426, "step": 8936 }, { "epoch": 1.65, "learning_rate": 8.832164068623404e-06, "loss": 0.4122, "step": 8937 }, { "epoch": 1.65, "learning_rate": 8.830180307634412e-06, "loss": 0.4254, "step": 8938 }, { "epoch": 1.65, "learning_rate": 8.828196593319056e-06, "loss": 0.4208, "step": 8939 }, { "epoch": 1.65, "learning_rate": 8.826212925756487e-06, "loss": 0.43, "step": 8940 }, { "epoch": 1.65, "learning_rate": 8.824229305025851e-06, "loss": 0.4418, "step": 8941 }, { "epoch": 1.65, "learning_rate": 8.822245731206287e-06, "loss": 0.4383, "step": 8942 }, { "epoch": 1.65, "learning_rate": 8.820262204376938e-06, "loss": 0.4157, "step": 8943 }, { "epoch": 1.65, "learning_rate": 8.818278724616943e-06, "loss": 0.4238, "step": 8944 }, { "epoch": 1.65, "learning_rate": 8.816295292005439e-06, "loss": 0.4225, "step": 8945 }, { "epoch": 1.66, "learning_rate": 8.814311906621564e-06, "loss": 0.4201, "step": 8946 }, { "epoch": 1.66, "learning_rate": 8.812328568544444e-06, "loss": 0.4197, "step": 8947 }, { "epoch": 1.66, "learning_rate": 8.810345277853218e-06, "loss": 0.432, "step": 8948 }, { "epoch": 1.66, "learning_rate": 8.80836203462701e-06, "loss": 0.4269, "step": 8949 }, { "epoch": 1.66, "learning_rate": 8.806378838944954e-06, "loss": 0.4481, "step": 8950 }, { "epoch": 1.66, "learning_rate": 8.804395690886174e-06, "loss": 0.4347, "step": 8951 }, { "epoch": 1.66, "learning_rate": 8.802412590529787e-06, "loss": 0.4053, "step": 8952 }, { "epoch": 1.66, "learning_rate": 8.800429537954925e-06, "loss": 0.4646, "step": 8953 }, { "epoch": 1.66, "learning_rate": 8.7984465332407e-06, "loss": 0.4342, "step": 8954 }, { "epoch": 1.66, "learning_rate": 8.796463576466236e-06, "loss": 0.4297, "step": 8955 }, { "epoch": 1.66, "learning_rate": 8.794480667710647e-06, "loss": 0.4271, "step": 8956 }, { "epoch": 1.66, "learning_rate": 8.792497807053044e-06, "loss": 0.4542, "step": 8957 }, { "epoch": 1.66, "learning_rate": 8.790514994572548e-06, "loss": 0.4203, "step": 8958 }, { "epoch": 1.66, "learning_rate": 8.788532230348258e-06, "loss": 0.4441, "step": 8959 }, { "epoch": 1.66, "learning_rate": 8.786549514459296e-06, "loss": 0.4297, "step": 8960 }, { "epoch": 1.66, "learning_rate": 8.78456684698476e-06, "loss": 0.4084, "step": 8961 }, { "epoch": 1.66, "learning_rate": 8.782584228003754e-06, "loss": 0.428, "step": 8962 }, { "epoch": 1.66, "learning_rate": 8.780601657595385e-06, "loss": 0.4332, "step": 8963 }, { "epoch": 1.66, "learning_rate": 8.778619135838748e-06, "loss": 0.4457, "step": 8964 }, { "epoch": 1.66, "learning_rate": 8.776636662812953e-06, "loss": 0.4323, "step": 8965 }, { "epoch": 1.66, "learning_rate": 8.774654238597084e-06, "loss": 0.4505, "step": 8966 }, { "epoch": 1.66, "learning_rate": 8.772671863270248e-06, "loss": 0.4399, "step": 8967 }, { "epoch": 1.66, "learning_rate": 8.770689536911528e-06, "loss": 0.417, "step": 8968 }, { "epoch": 1.66, "learning_rate": 8.76870725960002e-06, "loss": 0.4303, "step": 8969 }, { "epoch": 1.66, "learning_rate": 8.766725031414814e-06, "loss": 0.4237, "step": 8970 }, { "epoch": 1.66, "learning_rate": 8.764742852434996e-06, "loss": 0.4314, "step": 8971 }, { "epoch": 1.66, "learning_rate": 8.76276072273965e-06, "loss": 0.4357, "step": 8972 }, { "epoch": 1.66, "learning_rate": 8.760778642407862e-06, "loss": 0.4269, "step": 8973 }, { "epoch": 1.66, "learning_rate": 8.758796611518708e-06, "loss": 0.4501, "step": 8974 }, { "epoch": 1.66, "learning_rate": 8.756814630151276e-06, "loss": 0.4462, "step": 8975 }, { "epoch": 1.66, "learning_rate": 8.754832698384634e-06, "loss": 0.412, "step": 8976 }, { "epoch": 1.66, "learning_rate": 8.752850816297866e-06, "loss": 0.4288, "step": 8977 }, { "epoch": 1.66, "learning_rate": 8.750868983970043e-06, "loss": 0.4121, "step": 8978 }, { "epoch": 1.66, "learning_rate": 8.74888720148023e-06, "loss": 0.4357, "step": 8979 }, { "epoch": 1.66, "learning_rate": 8.746905468907503e-06, "loss": 0.4226, "step": 8980 }, { "epoch": 1.66, "learning_rate": 8.744923786330927e-06, "loss": 0.4123, "step": 8981 }, { "epoch": 1.66, "learning_rate": 8.74294215382957e-06, "loss": 0.4203, "step": 8982 }, { "epoch": 1.66, "learning_rate": 8.740960571482495e-06, "loss": 0.4207, "step": 8983 }, { "epoch": 1.66, "learning_rate": 8.738979039368758e-06, "loss": 0.4487, "step": 8984 }, { "epoch": 1.66, "learning_rate": 8.736997557567426e-06, "loss": 0.4264, "step": 8985 }, { "epoch": 1.66, "learning_rate": 8.735016126157549e-06, "loss": 0.4404, "step": 8986 }, { "epoch": 1.66, "learning_rate": 8.73303474521819e-06, "loss": 0.4587, "step": 8987 }, { "epoch": 1.66, "learning_rate": 8.731053414828397e-06, "loss": 0.4196, "step": 8988 }, { "epoch": 1.66, "learning_rate": 8.729072135067226e-06, "loss": 0.4533, "step": 8989 }, { "epoch": 1.66, "learning_rate": 8.727090906013724e-06, "loss": 0.4218, "step": 8990 }, { "epoch": 1.66, "learning_rate": 8.725109727746934e-06, "loss": 0.4166, "step": 8991 }, { "epoch": 1.66, "learning_rate": 8.723128600345909e-06, "loss": 0.4272, "step": 8992 }, { "epoch": 1.66, "learning_rate": 8.721147523889685e-06, "loss": 0.434, "step": 8993 }, { "epoch": 1.66, "learning_rate": 8.719166498457312e-06, "loss": 0.4254, "step": 8994 }, { "epoch": 1.66, "learning_rate": 8.717185524127822e-06, "loss": 0.4262, "step": 8995 }, { "epoch": 1.66, "learning_rate": 8.715204600980254e-06, "loss": 0.4541, "step": 8996 }, { "epoch": 1.66, "learning_rate": 8.713223729093643e-06, "loss": 0.425, "step": 8997 }, { "epoch": 1.66, "learning_rate": 8.711242908547025e-06, "loss": 0.4322, "step": 8998 }, { "epoch": 1.66, "learning_rate": 8.709262139419425e-06, "loss": 0.4572, "step": 8999 }, { "epoch": 1.67, "learning_rate": 8.707281421789882e-06, "loss": 0.439, "step": 9000 }, { "epoch": 1.67, "learning_rate": 8.70530075573741e-06, "loss": 0.439, "step": 9001 }, { "epoch": 1.67, "learning_rate": 8.703320141341047e-06, "loss": 0.4255, "step": 9002 }, { "epoch": 1.67, "learning_rate": 8.701339578679803e-06, "loss": 0.4324, "step": 9003 }, { "epoch": 1.67, "learning_rate": 8.699359067832712e-06, "loss": 0.4254, "step": 9004 }, { "epoch": 1.67, "learning_rate": 8.697378608878786e-06, "loss": 0.4353, "step": 9005 }, { "epoch": 1.67, "learning_rate": 8.695398201897036e-06, "loss": 0.4502, "step": 9006 }, { "epoch": 1.67, "learning_rate": 8.693417846966488e-06, "loss": 0.4387, "step": 9007 }, { "epoch": 1.67, "learning_rate": 8.691437544166143e-06, "loss": 0.4154, "step": 9008 }, { "epoch": 1.67, "learning_rate": 8.689457293575024e-06, "loss": 0.416, "step": 9009 }, { "epoch": 1.67, "learning_rate": 8.68747709527213e-06, "loss": 0.4363, "step": 9010 }, { "epoch": 1.67, "learning_rate": 8.685496949336468e-06, "loss": 0.4138, "step": 9011 }, { "epoch": 1.67, "learning_rate": 8.683516855847046e-06, "loss": 0.4259, "step": 9012 }, { "epoch": 1.67, "learning_rate": 8.681536814882861e-06, "loss": 0.4321, "step": 9013 }, { "epoch": 1.67, "learning_rate": 8.679556826522919e-06, "loss": 0.434, "step": 9014 }, { "epoch": 1.67, "learning_rate": 8.677576890846212e-06, "loss": 0.4267, "step": 9015 }, { "epoch": 1.67, "learning_rate": 8.675597007931742e-06, "loss": 0.4272, "step": 9016 }, { "epoch": 1.67, "learning_rate": 8.673617177858497e-06, "loss": 0.4186, "step": 9017 }, { "epoch": 1.67, "learning_rate": 8.671637400705473e-06, "loss": 0.4253, "step": 9018 }, { "epoch": 1.67, "learning_rate": 8.669657676551654e-06, "loss": 0.4248, "step": 9019 }, { "epoch": 1.67, "learning_rate": 8.667678005476034e-06, "loss": 0.437, "step": 9020 }, { "epoch": 1.67, "learning_rate": 8.665698387557593e-06, "loss": 0.4403, "step": 9021 }, { "epoch": 1.67, "learning_rate": 8.66371882287532e-06, "loss": 0.4215, "step": 9022 }, { "epoch": 1.67, "learning_rate": 8.661739311508185e-06, "loss": 0.4268, "step": 9023 }, { "epoch": 1.67, "learning_rate": 8.65975985353518e-06, "loss": 0.4296, "step": 9024 }, { "epoch": 1.67, "learning_rate": 8.65778044903527e-06, "loss": 0.4114, "step": 9025 }, { "epoch": 1.67, "learning_rate": 8.655801098087439e-06, "loss": 0.4364, "step": 9026 }, { "epoch": 1.67, "learning_rate": 8.653821800770655e-06, "loss": 0.4123, "step": 9027 }, { "epoch": 1.67, "learning_rate": 8.651842557163886e-06, "loss": 0.4316, "step": 9028 }, { "epoch": 1.67, "learning_rate": 8.649863367346108e-06, "loss": 0.4322, "step": 9029 }, { "epoch": 1.67, "learning_rate": 8.647884231396276e-06, "loss": 0.4341, "step": 9030 }, { "epoch": 1.67, "learning_rate": 8.645905149393363e-06, "loss": 0.4235, "step": 9031 }, { "epoch": 1.67, "learning_rate": 8.64392612141633e-06, "loss": 0.4371, "step": 9032 }, { "epoch": 1.67, "learning_rate": 8.641947147544128e-06, "loss": 0.4333, "step": 9033 }, { "epoch": 1.67, "learning_rate": 8.639968227855726e-06, "loss": 0.4449, "step": 9034 }, { "epoch": 1.67, "learning_rate": 8.637989362430068e-06, "loss": 0.4189, "step": 9035 }, { "epoch": 1.67, "learning_rate": 8.63601055134612e-06, "loss": 0.4381, "step": 9036 }, { "epoch": 1.67, "learning_rate": 8.634031794682818e-06, "loss": 0.4458, "step": 9037 }, { "epoch": 1.67, "learning_rate": 8.632053092519123e-06, "loss": 0.4277, "step": 9038 }, { "epoch": 1.67, "learning_rate": 8.630074444933977e-06, "loss": 0.433, "step": 9039 }, { "epoch": 1.67, "learning_rate": 8.628095852006322e-06, "loss": 0.4267, "step": 9040 }, { "epoch": 1.67, "learning_rate": 8.626117313815106e-06, "loss": 0.423, "step": 9041 }, { "epoch": 1.67, "learning_rate": 8.62413883043926e-06, "loss": 0.4316, "step": 9042 }, { "epoch": 1.67, "learning_rate": 8.622160401957733e-06, "loss": 0.4328, "step": 9043 }, { "epoch": 1.67, "learning_rate": 8.620182028449451e-06, "loss": 0.4039, "step": 9044 }, { "epoch": 1.67, "learning_rate": 8.618203709993353e-06, "loss": 0.4265, "step": 9045 }, { "epoch": 1.67, "learning_rate": 8.61622544666837e-06, "loss": 0.4147, "step": 9046 }, { "epoch": 1.67, "learning_rate": 8.614247238553428e-06, "loss": 0.4255, "step": 9047 }, { "epoch": 1.67, "learning_rate": 8.612269085727453e-06, "loss": 0.4437, "step": 9048 }, { "epoch": 1.67, "learning_rate": 8.610290988269378e-06, "loss": 0.4318, "step": 9049 }, { "epoch": 1.67, "learning_rate": 8.608312946258115e-06, "loss": 0.413, "step": 9050 }, { "epoch": 1.67, "learning_rate": 8.606334959772591e-06, "loss": 0.4237, "step": 9051 }, { "epoch": 1.67, "learning_rate": 8.604357028891719e-06, "loss": 0.4275, "step": 9052 }, { "epoch": 1.67, "learning_rate": 8.602379153694423e-06, "loss": 0.4356, "step": 9053 }, { "epoch": 1.68, "learning_rate": 8.600401334259609e-06, "loss": 0.4294, "step": 9054 }, { "epoch": 1.68, "learning_rate": 8.598423570666187e-06, "loss": 0.4071, "step": 9055 }, { "epoch": 1.68, "learning_rate": 8.596445862993073e-06, "loss": 0.4276, "step": 9056 }, { "epoch": 1.68, "learning_rate": 8.594468211319167e-06, "loss": 0.4338, "step": 9057 }, { "epoch": 1.68, "learning_rate": 8.592490615723381e-06, "loss": 0.4456, "step": 9058 }, { "epoch": 1.68, "learning_rate": 8.59051307628461e-06, "loss": 0.4353, "step": 9059 }, { "epoch": 1.68, "learning_rate": 8.588535593081761e-06, "loss": 0.4165, "step": 9060 }, { "epoch": 1.68, "learning_rate": 8.586558166193731e-06, "loss": 0.4255, "step": 9061 }, { "epoch": 1.68, "learning_rate": 8.584580795699406e-06, "loss": 0.4084, "step": 9062 }, { "epoch": 1.68, "learning_rate": 8.58260348167769e-06, "loss": 0.4207, "step": 9063 }, { "epoch": 1.68, "learning_rate": 8.58062622420747e-06, "loss": 0.4211, "step": 9064 }, { "epoch": 1.68, "learning_rate": 8.578649023367639e-06, "loss": 0.4412, "step": 9065 }, { "epoch": 1.68, "learning_rate": 8.576671879237077e-06, "loss": 0.4467, "step": 9066 }, { "epoch": 1.68, "learning_rate": 8.574694791894673e-06, "loss": 0.4227, "step": 9067 }, { "epoch": 1.68, "learning_rate": 8.572717761419307e-06, "loss": 0.4475, "step": 9068 }, { "epoch": 1.68, "learning_rate": 8.570740787889861e-06, "loss": 0.4205, "step": 9069 }, { "epoch": 1.68, "learning_rate": 8.568763871385211e-06, "loss": 0.4124, "step": 9070 }, { "epoch": 1.68, "learning_rate": 8.566787011984234e-06, "loss": 0.4288, "step": 9071 }, { "epoch": 1.68, "learning_rate": 8.564810209765799e-06, "loss": 0.4349, "step": 9072 }, { "epoch": 1.68, "learning_rate": 8.562833464808782e-06, "loss": 0.4176, "step": 9073 }, { "epoch": 1.68, "learning_rate": 8.560856777192044e-06, "loss": 0.4277, "step": 9074 }, { "epoch": 1.68, "learning_rate": 8.558880146994463e-06, "loss": 0.4348, "step": 9075 }, { "epoch": 1.68, "learning_rate": 8.556903574294895e-06, "loss": 0.4175, "step": 9076 }, { "epoch": 1.68, "learning_rate": 8.554927059172198e-06, "loss": 0.4484, "step": 9077 }, { "epoch": 1.68, "learning_rate": 8.552950601705239e-06, "loss": 0.4209, "step": 9078 }, { "epoch": 1.68, "learning_rate": 8.550974201972869e-06, "loss": 0.4111, "step": 9079 }, { "epoch": 1.68, "learning_rate": 8.548997860053948e-06, "loss": 0.4263, "step": 9080 }, { "epoch": 1.68, "learning_rate": 8.547021576027324e-06, "loss": 0.4412, "step": 9081 }, { "epoch": 1.68, "learning_rate": 8.545045349971852e-06, "loss": 0.4148, "step": 9082 }, { "epoch": 1.68, "learning_rate": 8.543069181966379e-06, "loss": 0.4428, "step": 9083 }, { "epoch": 1.68, "learning_rate": 8.54109307208974e-06, "loss": 0.4255, "step": 9084 }, { "epoch": 1.68, "learning_rate": 8.539117020420795e-06, "loss": 0.3902, "step": 9085 }, { "epoch": 1.68, "learning_rate": 8.537141027038368e-06, "loss": 0.394, "step": 9086 }, { "epoch": 1.68, "learning_rate": 8.53516509202131e-06, "loss": 0.4348, "step": 9087 }, { "epoch": 1.68, "learning_rate": 8.533189215448456e-06, "loss": 0.4349, "step": 9088 }, { "epoch": 1.68, "learning_rate": 8.53121339739863e-06, "loss": 0.4394, "step": 9089 }, { "epoch": 1.68, "learning_rate": 8.529237637950675e-06, "loss": 0.4275, "step": 9090 }, { "epoch": 1.68, "learning_rate": 8.527261937183411e-06, "loss": 0.437, "step": 9091 }, { "epoch": 1.68, "learning_rate": 8.525286295175672e-06, "loss": 0.4395, "step": 9092 }, { "epoch": 1.68, "learning_rate": 8.523310712006279e-06, "loss": 0.4333, "step": 9093 }, { "epoch": 1.68, "learning_rate": 8.521335187754053e-06, "loss": 0.4072, "step": 9094 }, { "epoch": 1.68, "learning_rate": 8.519359722497818e-06, "loss": 0.4118, "step": 9095 }, { "epoch": 1.68, "learning_rate": 8.517384316316386e-06, "loss": 0.4243, "step": 9096 }, { "epoch": 1.68, "learning_rate": 8.515408969288575e-06, "loss": 0.423, "step": 9097 }, { "epoch": 1.68, "learning_rate": 8.513433681493201e-06, "loss": 0.4347, "step": 9098 }, { "epoch": 1.68, "learning_rate": 8.511458453009066e-06, "loss": 0.4189, "step": 9099 }, { "epoch": 1.68, "learning_rate": 8.509483283914987e-06, "loss": 0.4455, "step": 9100 }, { "epoch": 1.68, "learning_rate": 8.507508174289761e-06, "loss": 0.4206, "step": 9101 }, { "epoch": 1.68, "learning_rate": 8.5055331242122e-06, "loss": 0.4273, "step": 9102 }, { "epoch": 1.68, "learning_rate": 8.503558133761096e-06, "loss": 0.4334, "step": 9103 }, { "epoch": 1.68, "learning_rate": 8.501583203015256e-06, "loss": 0.4397, "step": 9104 }, { "epoch": 1.68, "learning_rate": 8.499608332053472e-06, "loss": 0.447, "step": 9105 }, { "epoch": 1.68, "learning_rate": 8.497633520954534e-06, "loss": 0.4374, "step": 9106 }, { "epoch": 1.68, "learning_rate": 8.49565876979724e-06, "loss": 0.4319, "step": 9107 }, { "epoch": 1.69, "learning_rate": 8.493684078660373e-06, "loss": 0.4301, "step": 9108 }, { "epoch": 1.69, "learning_rate": 8.491709447622726e-06, "loss": 0.4301, "step": 9109 }, { "epoch": 1.69, "learning_rate": 8.48973487676308e-06, "loss": 0.4261, "step": 9110 }, { "epoch": 1.69, "learning_rate": 8.487760366160211e-06, "loss": 0.4264, "step": 9111 }, { "epoch": 1.69, "learning_rate": 8.485785915892907e-06, "loss": 0.4307, "step": 9112 }, { "epoch": 1.69, "learning_rate": 8.483811526039939e-06, "loss": 0.4476, "step": 9113 }, { "epoch": 1.69, "learning_rate": 8.481837196680088e-06, "loss": 0.4261, "step": 9114 }, { "epoch": 1.69, "learning_rate": 8.479862927892121e-06, "loss": 0.4349, "step": 9115 }, { "epoch": 1.69, "learning_rate": 8.477888719754805e-06, "loss": 0.4216, "step": 9116 }, { "epoch": 1.69, "learning_rate": 8.475914572346915e-06, "loss": 0.4418, "step": 9117 }, { "epoch": 1.69, "learning_rate": 8.47394048574721e-06, "loss": 0.4143, "step": 9118 }, { "epoch": 1.69, "learning_rate": 8.471966460034452e-06, "loss": 0.4198, "step": 9119 }, { "epoch": 1.69, "learning_rate": 8.46999249528741e-06, "loss": 0.4264, "step": 9120 }, { "epoch": 1.69, "learning_rate": 8.468018591584827e-06, "loss": 0.4378, "step": 9121 }, { "epoch": 1.69, "learning_rate": 8.46604474900547e-06, "loss": 0.421, "step": 9122 }, { "epoch": 1.69, "learning_rate": 8.464070967628084e-06, "loss": 0.434, "step": 9123 }, { "epoch": 1.69, "learning_rate": 8.462097247531428e-06, "loss": 0.4395, "step": 9124 }, { "epoch": 1.69, "learning_rate": 8.46012358879424e-06, "loss": 0.4494, "step": 9125 }, { "epoch": 1.69, "learning_rate": 8.458149991495274e-06, "loss": 0.424, "step": 9126 }, { "epoch": 1.69, "learning_rate": 8.456176455713268e-06, "loss": 0.4329, "step": 9127 }, { "epoch": 1.69, "learning_rate": 8.45420298152696e-06, "loss": 0.4354, "step": 9128 }, { "epoch": 1.69, "learning_rate": 8.452229569015093e-06, "loss": 0.423, "step": 9129 }, { "epoch": 1.69, "learning_rate": 8.450256218256398e-06, "loss": 0.4428, "step": 9130 }, { "epoch": 1.69, "learning_rate": 8.448282929329616e-06, "loss": 0.4225, "step": 9131 }, { "epoch": 1.69, "learning_rate": 8.44630970231347e-06, "loss": 0.435, "step": 9132 }, { "epoch": 1.69, "learning_rate": 8.444336537286686e-06, "loss": 0.4485, "step": 9133 }, { "epoch": 1.69, "learning_rate": 8.442363434328e-06, "loss": 0.4403, "step": 9134 }, { "epoch": 1.69, "learning_rate": 8.440390393516124e-06, "loss": 0.4316, "step": 9135 }, { "epoch": 1.69, "learning_rate": 8.438417414929787e-06, "loss": 0.4219, "step": 9136 }, { "epoch": 1.69, "learning_rate": 8.436444498647705e-06, "loss": 0.4273, "step": 9137 }, { "epoch": 1.69, "learning_rate": 8.434471644748589e-06, "loss": 0.4428, "step": 9138 }, { "epoch": 1.69, "learning_rate": 8.432498853311158e-06, "loss": 0.4155, "step": 9139 }, { "epoch": 1.69, "learning_rate": 8.430526124414118e-06, "loss": 0.4389, "step": 9140 }, { "epoch": 1.69, "learning_rate": 8.428553458136185e-06, "loss": 0.4212, "step": 9141 }, { "epoch": 1.69, "learning_rate": 8.426580854556055e-06, "loss": 0.4426, "step": 9142 }, { "epoch": 1.69, "learning_rate": 8.424608313752438e-06, "loss": 0.4219, "step": 9143 }, { "epoch": 1.69, "learning_rate": 8.42263583580403e-06, "loss": 0.414, "step": 9144 }, { "epoch": 1.69, "learning_rate": 8.420663420789535e-06, "loss": 0.4345, "step": 9145 }, { "epoch": 1.69, "learning_rate": 8.418691068787644e-06, "loss": 0.4508, "step": 9146 }, { "epoch": 1.69, "learning_rate": 8.41671877987705e-06, "loss": 0.4202, "step": 9147 }, { "epoch": 1.69, "learning_rate": 8.414746554136447e-06, "loss": 0.4356, "step": 9148 }, { "epoch": 1.69, "learning_rate": 8.412774391644522e-06, "loss": 0.4221, "step": 9149 }, { "epoch": 1.69, "learning_rate": 8.410802292479958e-06, "loss": 0.4344, "step": 9150 }, { "epoch": 1.69, "learning_rate": 8.408830256721443e-06, "loss": 0.4432, "step": 9151 }, { "epoch": 1.69, "learning_rate": 8.406858284447652e-06, "loss": 0.4296, "step": 9152 }, { "epoch": 1.69, "learning_rate": 8.40488637573727e-06, "loss": 0.4366, "step": 9153 }, { "epoch": 1.69, "learning_rate": 8.402914530668966e-06, "loss": 0.4334, "step": 9154 }, { "epoch": 1.69, "learning_rate": 8.400942749321413e-06, "loss": 0.4078, "step": 9155 }, { "epoch": 1.69, "learning_rate": 8.398971031773288e-06, "loss": 0.4063, "step": 9156 }, { "epoch": 1.69, "learning_rate": 8.39699937810325e-06, "loss": 0.4289, "step": 9157 }, { "epoch": 1.69, "learning_rate": 8.395027788389972e-06, "loss": 0.4154, "step": 9158 }, { "epoch": 1.69, "learning_rate": 8.393056262712116e-06, "loss": 0.4338, "step": 9159 }, { "epoch": 1.69, "learning_rate": 8.391084801148334e-06, "loss": 0.4034, "step": 9160 }, { "epoch": 1.69, "learning_rate": 8.389113403777294e-06, "loss": 0.4337, "step": 9161 }, { "epoch": 1.7, "learning_rate": 8.387142070677643e-06, "loss": 0.4592, "step": 9162 }, { "epoch": 1.7, "learning_rate": 8.385170801928042e-06, "loss": 0.418, "step": 9163 }, { "epoch": 1.7, "learning_rate": 8.383199597607135e-06, "loss": 0.4372, "step": 9164 }, { "epoch": 1.7, "learning_rate": 8.381228457793566e-06, "loss": 0.4421, "step": 9165 }, { "epoch": 1.7, "learning_rate": 8.37925738256599e-06, "loss": 0.44, "step": 9166 }, { "epoch": 1.7, "learning_rate": 8.377286372003039e-06, "loss": 0.436, "step": 9167 }, { "epoch": 1.7, "learning_rate": 8.375315426183362e-06, "loss": 0.4437, "step": 9168 }, { "epoch": 1.7, "learning_rate": 8.373344545185586e-06, "loss": 0.4272, "step": 9169 }, { "epoch": 1.7, "learning_rate": 8.371373729088356e-06, "loss": 0.4327, "step": 9170 }, { "epoch": 1.7, "learning_rate": 8.369402977970297e-06, "loss": 0.4152, "step": 9171 }, { "epoch": 1.7, "learning_rate": 8.367432291910042e-06, "loss": 0.4244, "step": 9172 }, { "epoch": 1.7, "learning_rate": 8.365461670986214e-06, "loss": 0.4596, "step": 9173 }, { "epoch": 1.7, "learning_rate": 8.363491115277438e-06, "loss": 0.4383, "step": 9174 }, { "epoch": 1.7, "learning_rate": 8.361520624862339e-06, "loss": 0.4332, "step": 9175 }, { "epoch": 1.7, "learning_rate": 8.359550199819533e-06, "loss": 0.4356, "step": 9176 }, { "epoch": 1.7, "learning_rate": 8.357579840227634e-06, "loss": 0.4329, "step": 9177 }, { "epoch": 1.7, "learning_rate": 8.355609546165264e-06, "loss": 0.4301, "step": 9178 }, { "epoch": 1.7, "learning_rate": 8.353639317711022e-06, "loss": 0.4357, "step": 9179 }, { "epoch": 1.7, "learning_rate": 8.35166915494353e-06, "loss": 0.4194, "step": 9180 }, { "epoch": 1.7, "learning_rate": 8.349699057941383e-06, "loss": 0.4433, "step": 9181 }, { "epoch": 1.7, "learning_rate": 8.347729026783186e-06, "loss": 0.4185, "step": 9182 }, { "epoch": 1.7, "learning_rate": 8.345759061547547e-06, "loss": 0.4434, "step": 9183 }, { "epoch": 1.7, "learning_rate": 8.343789162313054e-06, "loss": 0.4625, "step": 9184 }, { "epoch": 1.7, "learning_rate": 8.34181932915831e-06, "loss": 0.4419, "step": 9185 }, { "epoch": 1.7, "learning_rate": 8.339849562161906e-06, "loss": 0.4145, "step": 9186 }, { "epoch": 1.7, "learning_rate": 8.337879861402425e-06, "loss": 0.4331, "step": 9187 }, { "epoch": 1.7, "learning_rate": 8.335910226958467e-06, "loss": 0.4239, "step": 9188 }, { "epoch": 1.7, "learning_rate": 8.333940658908603e-06, "loss": 0.4215, "step": 9189 }, { "epoch": 1.7, "learning_rate": 8.331971157331428e-06, "loss": 0.4204, "step": 9190 }, { "epoch": 1.7, "learning_rate": 8.330001722305512e-06, "loss": 0.3978, "step": 9191 }, { "epoch": 1.7, "learning_rate": 8.328032353909439e-06, "loss": 0.416, "step": 9192 }, { "epoch": 1.7, "learning_rate": 8.326063052221775e-06, "loss": 0.4238, "step": 9193 }, { "epoch": 1.7, "learning_rate": 8.3240938173211e-06, "loss": 0.4208, "step": 9194 }, { "epoch": 1.7, "learning_rate": 8.322124649285977e-06, "loss": 0.4113, "step": 9195 }, { "epoch": 1.7, "learning_rate": 8.320155548194972e-06, "loss": 0.4251, "step": 9196 }, { "epoch": 1.7, "learning_rate": 8.318186514126652e-06, "loss": 0.4457, "step": 9197 }, { "epoch": 1.7, "learning_rate": 8.316217547159579e-06, "loss": 0.4132, "step": 9198 }, { "epoch": 1.7, "learning_rate": 8.314248647372303e-06, "loss": 0.4036, "step": 9199 }, { "epoch": 1.7, "learning_rate": 8.312279814843392e-06, "loss": 0.4422, "step": 9200 }, { "epoch": 1.7, "learning_rate": 8.310311049651385e-06, "loss": 0.4168, "step": 9201 }, { "epoch": 1.7, "learning_rate": 8.308342351874843e-06, "loss": 0.411, "step": 9202 }, { "epoch": 1.7, "learning_rate": 8.30637372159231e-06, "loss": 0.4369, "step": 9203 }, { "epoch": 1.7, "learning_rate": 8.304405158882325e-06, "loss": 0.4313, "step": 9204 }, { "epoch": 1.7, "learning_rate": 8.302436663823438e-06, "loss": 0.4339, "step": 9205 }, { "epoch": 1.7, "learning_rate": 8.300468236494183e-06, "loss": 0.4092, "step": 9206 }, { "epoch": 1.7, "learning_rate": 8.298499876973101e-06, "loss": 0.4547, "step": 9207 }, { "epoch": 1.7, "learning_rate": 8.296531585338726e-06, "loss": 0.4213, "step": 9208 }, { "epoch": 1.7, "learning_rate": 8.294563361669581e-06, "loss": 0.4462, "step": 9209 }, { "epoch": 1.7, "learning_rate": 8.292595206044206e-06, "loss": 0.4154, "step": 9210 }, { "epoch": 1.7, "learning_rate": 8.290627118541114e-06, "loss": 0.4185, "step": 9211 }, { "epoch": 1.7, "learning_rate": 8.288659099238841e-06, "loss": 0.4305, "step": 9212 }, { "epoch": 1.7, "learning_rate": 8.286691148215899e-06, "loss": 0.4375, "step": 9213 }, { "epoch": 1.7, "learning_rate": 8.28472326555081e-06, "loss": 0.4126, "step": 9214 }, { "epoch": 1.7, "learning_rate": 8.282755451322087e-06, "loss": 0.414, "step": 9215 }, { "epoch": 1.71, "learning_rate": 8.28078770560824e-06, "loss": 0.4133, "step": 9216 }, { "epoch": 1.71, "learning_rate": 8.278820028487782e-06, "loss": 0.4234, "step": 9217 }, { "epoch": 1.71, "learning_rate": 8.276852420039216e-06, "loss": 0.4429, "step": 9218 }, { "epoch": 1.71, "learning_rate": 8.274884880341051e-06, "loss": 0.4468, "step": 9219 }, { "epoch": 1.71, "learning_rate": 8.272917409471785e-06, "loss": 0.4241, "step": 9220 }, { "epoch": 1.71, "learning_rate": 8.270950007509915e-06, "loss": 0.44, "step": 9221 }, { "epoch": 1.71, "learning_rate": 8.268982674533938e-06, "loss": 0.4089, "step": 9222 }, { "epoch": 1.71, "learning_rate": 8.26701541062235e-06, "loss": 0.4237, "step": 9223 }, { "epoch": 1.71, "learning_rate": 8.265048215853635e-06, "loss": 0.4438, "step": 9224 }, { "epoch": 1.71, "learning_rate": 8.26308109030629e-06, "loss": 0.4072, "step": 9225 }, { "epoch": 1.71, "learning_rate": 8.261114034058788e-06, "loss": 0.4081, "step": 9226 }, { "epoch": 1.71, "learning_rate": 8.259147047189619e-06, "loss": 0.421, "step": 9227 }, { "epoch": 1.71, "learning_rate": 8.257180129777258e-06, "loss": 0.4434, "step": 9228 }, { "epoch": 1.71, "learning_rate": 8.255213281900186e-06, "loss": 0.4582, "step": 9229 }, { "epoch": 1.71, "learning_rate": 8.253246503636873e-06, "loss": 0.4341, "step": 9230 }, { "epoch": 1.71, "learning_rate": 8.251279795065788e-06, "loss": 0.4338, "step": 9231 }, { "epoch": 1.71, "learning_rate": 8.249313156265403e-06, "loss": 0.4356, "step": 9232 }, { "epoch": 1.71, "learning_rate": 8.24734658731418e-06, "loss": 0.4522, "step": 9233 }, { "epoch": 1.71, "learning_rate": 8.245380088290587e-06, "loss": 0.4318, "step": 9234 }, { "epoch": 1.71, "learning_rate": 8.243413659273077e-06, "loss": 0.4388, "step": 9235 }, { "epoch": 1.71, "learning_rate": 8.241447300340111e-06, "loss": 0.4306, "step": 9236 }, { "epoch": 1.71, "learning_rate": 8.239481011570144e-06, "loss": 0.4478, "step": 9237 }, { "epoch": 1.71, "learning_rate": 8.23751479304162e-06, "loss": 0.4591, "step": 9238 }, { "epoch": 1.71, "learning_rate": 8.235548644832997e-06, "loss": 0.4332, "step": 9239 }, { "epoch": 1.71, "learning_rate": 8.233582567022713e-06, "loss": 0.4305, "step": 9240 }, { "epoch": 1.71, "learning_rate": 8.231616559689217e-06, "loss": 0.4062, "step": 9241 }, { "epoch": 1.71, "learning_rate": 8.229650622910943e-06, "loss": 0.4274, "step": 9242 }, { "epoch": 1.71, "learning_rate": 8.227684756766334e-06, "loss": 0.4204, "step": 9243 }, { "epoch": 1.71, "learning_rate": 8.22571896133382e-06, "loss": 0.4272, "step": 9244 }, { "epoch": 1.71, "learning_rate": 8.223753236691836e-06, "loss": 0.4067, "step": 9245 }, { "epoch": 1.71, "learning_rate": 8.221787582918807e-06, "loss": 0.4388, "step": 9246 }, { "epoch": 1.71, "learning_rate": 8.219822000093166e-06, "loss": 0.4314, "step": 9247 }, { "epoch": 1.71, "learning_rate": 8.217856488293326e-06, "loss": 0.4388, "step": 9248 }, { "epoch": 1.71, "learning_rate": 8.215891047597716e-06, "loss": 0.4434, "step": 9249 }, { "epoch": 1.71, "learning_rate": 8.213925678084746e-06, "loss": 0.4417, "step": 9250 }, { "epoch": 1.71, "learning_rate": 8.211960379832839e-06, "loss": 0.443, "step": 9251 }, { "epoch": 1.71, "learning_rate": 8.209995152920403e-06, "loss": 0.436, "step": 9252 }, { "epoch": 1.71, "learning_rate": 8.208029997425842e-06, "loss": 0.4071, "step": 9253 }, { "epoch": 1.71, "learning_rate": 8.20606491342757e-06, "loss": 0.4564, "step": 9254 }, { "epoch": 1.71, "learning_rate": 8.204099901003983e-06, "loss": 0.4147, "step": 9255 }, { "epoch": 1.71, "learning_rate": 8.202134960233488e-06, "loss": 0.4222, "step": 9256 }, { "epoch": 1.71, "learning_rate": 8.200170091194477e-06, "loss": 0.4216, "step": 9257 }, { "epoch": 1.71, "learning_rate": 8.19820529396535e-06, "loss": 0.4373, "step": 9258 }, { "epoch": 1.71, "learning_rate": 8.196240568624496e-06, "loss": 0.4361, "step": 9259 }, { "epoch": 1.71, "learning_rate": 8.1942759152503e-06, "loss": 0.4025, "step": 9260 }, { "epoch": 1.71, "learning_rate": 8.192311333921155e-06, "loss": 0.4143, "step": 9261 }, { "epoch": 1.71, "learning_rate": 8.190346824715438e-06, "loss": 0.4363, "step": 9262 }, { "epoch": 1.71, "learning_rate": 8.188382387711536e-06, "loss": 0.4134, "step": 9263 }, { "epoch": 1.71, "learning_rate": 8.186418022987821e-06, "loss": 0.4422, "step": 9264 }, { "epoch": 1.71, "learning_rate": 8.184453730622667e-06, "loss": 0.4231, "step": 9265 }, { "epoch": 1.71, "learning_rate": 8.182489510694451e-06, "loss": 0.417, "step": 9266 }, { "epoch": 1.71, "learning_rate": 8.180525363281536e-06, "loss": 0.425, "step": 9267 }, { "epoch": 1.71, "learning_rate": 8.178561288462293e-06, "loss": 0.4331, "step": 9268 }, { "epoch": 1.71, "learning_rate": 8.176597286315079e-06, "loss": 0.4162, "step": 9269 }, { "epoch": 1.72, "learning_rate": 8.174633356918257e-06, "loss": 0.4553, "step": 9270 }, { "epoch": 1.72, "learning_rate": 8.172669500350188e-06, "loss": 0.442, "step": 9271 }, { "epoch": 1.72, "learning_rate": 8.17070571668922e-06, "loss": 0.4331, "step": 9272 }, { "epoch": 1.72, "learning_rate": 8.168742006013709e-06, "loss": 0.4367, "step": 9273 }, { "epoch": 1.72, "learning_rate": 8.166778368402002e-06, "loss": 0.4427, "step": 9274 }, { "epoch": 1.72, "learning_rate": 8.16481480393244e-06, "loss": 0.4305, "step": 9275 }, { "epoch": 1.72, "learning_rate": 8.162851312683373e-06, "loss": 0.4198, "step": 9276 }, { "epoch": 1.72, "learning_rate": 8.160887894733135e-06, "loss": 0.4227, "step": 9277 }, { "epoch": 1.72, "learning_rate": 8.158924550160067e-06, "loss": 0.4421, "step": 9278 }, { "epoch": 1.72, "learning_rate": 8.156961279042497e-06, "loss": 0.4373, "step": 9279 }, { "epoch": 1.72, "learning_rate": 8.154998081458766e-06, "loss": 0.4063, "step": 9280 }, { "epoch": 1.72, "learning_rate": 8.153034957487193e-06, "loss": 0.4268, "step": 9281 }, { "epoch": 1.72, "learning_rate": 8.151071907206105e-06, "loss": 0.4108, "step": 9282 }, { "epoch": 1.72, "learning_rate": 8.149108930693825e-06, "loss": 0.4286, "step": 9283 }, { "epoch": 1.72, "learning_rate": 8.14714602802867e-06, "loss": 0.444, "step": 9284 }, { "epoch": 1.72, "learning_rate": 8.145183199288961e-06, "loss": 0.4215, "step": 9285 }, { "epoch": 1.72, "learning_rate": 8.143220444553008e-06, "loss": 0.4295, "step": 9286 }, { "epoch": 1.72, "learning_rate": 8.141257763899118e-06, "loss": 0.4495, "step": 9287 }, { "epoch": 1.72, "learning_rate": 8.139295157405606e-06, "loss": 0.4197, "step": 9288 }, { "epoch": 1.72, "learning_rate": 8.13733262515077e-06, "loss": 0.4232, "step": 9289 }, { "epoch": 1.72, "learning_rate": 8.135370167212914e-06, "loss": 0.4276, "step": 9290 }, { "epoch": 1.72, "learning_rate": 8.13340778367034e-06, "loss": 0.4489, "step": 9291 }, { "epoch": 1.72, "learning_rate": 8.131445474601332e-06, "loss": 0.4165, "step": 9292 }, { "epoch": 1.72, "learning_rate": 8.129483240084195e-06, "loss": 0.4299, "step": 9293 }, { "epoch": 1.72, "learning_rate": 8.12752108019721e-06, "loss": 0.4225, "step": 9294 }, { "epoch": 1.72, "learning_rate": 8.125558995018672e-06, "loss": 0.4251, "step": 9295 }, { "epoch": 1.72, "learning_rate": 8.123596984626857e-06, "loss": 0.4176, "step": 9296 }, { "epoch": 1.72, "learning_rate": 8.121635049100048e-06, "loss": 0.4346, "step": 9297 }, { "epoch": 1.72, "learning_rate": 8.11967318851652e-06, "loss": 0.421, "step": 9298 }, { "epoch": 1.72, "learning_rate": 8.117711402954556e-06, "loss": 0.4289, "step": 9299 }, { "epoch": 1.72, "learning_rate": 8.115749692492418e-06, "loss": 0.427, "step": 9300 }, { "epoch": 1.72, "learning_rate": 8.11378805720838e-06, "loss": 0.4368, "step": 9301 }, { "epoch": 1.72, "learning_rate": 8.111826497180707e-06, "loss": 0.4322, "step": 9302 }, { "epoch": 1.72, "learning_rate": 8.109865012487662e-06, "loss": 0.4267, "step": 9303 }, { "epoch": 1.72, "learning_rate": 8.107903603207499e-06, "loss": 0.4324, "step": 9304 }, { "epoch": 1.72, "learning_rate": 8.105942269418485e-06, "loss": 0.4265, "step": 9305 }, { "epoch": 1.72, "learning_rate": 8.103981011198862e-06, "loss": 0.4269, "step": 9306 }, { "epoch": 1.72, "learning_rate": 8.10201982862689e-06, "loss": 0.4299, "step": 9307 }, { "epoch": 1.72, "learning_rate": 8.100058721780814e-06, "loss": 0.4212, "step": 9308 }, { "epoch": 1.72, "learning_rate": 8.098097690738873e-06, "loss": 0.4323, "step": 9309 }, { "epoch": 1.72, "learning_rate": 8.096136735579316e-06, "loss": 0.4018, "step": 9310 }, { "epoch": 1.72, "learning_rate": 8.094175856380375e-06, "loss": 0.4345, "step": 9311 }, { "epoch": 1.72, "learning_rate": 8.092215053220294e-06, "loss": 0.4391, "step": 9312 }, { "epoch": 1.72, "learning_rate": 8.0902543261773e-06, "loss": 0.4481, "step": 9313 }, { "epoch": 1.72, "learning_rate": 8.088293675329617e-06, "loss": 0.4532, "step": 9314 }, { "epoch": 1.72, "learning_rate": 8.086333100755482e-06, "loss": 0.4245, "step": 9315 }, { "epoch": 1.72, "learning_rate": 8.084372602533108e-06, "loss": 0.4195, "step": 9316 }, { "epoch": 1.72, "learning_rate": 8.082412180740726e-06, "loss": 0.4181, "step": 9317 }, { "epoch": 1.72, "learning_rate": 8.080451835456544e-06, "loss": 0.4211, "step": 9318 }, { "epoch": 1.72, "learning_rate": 8.078491566758782e-06, "loss": 0.4134, "step": 9319 }, { "epoch": 1.72, "learning_rate": 8.076531374725647e-06, "loss": 0.4384, "step": 9320 }, { "epoch": 1.72, "learning_rate": 8.07457125943535e-06, "loss": 0.4068, "step": 9321 }, { "epoch": 1.72, "learning_rate": 8.072611220966094e-06, "loss": 0.4301, "step": 9322 }, { "epoch": 1.72, "learning_rate": 8.070651259396083e-06, "loss": 0.4243, "step": 9323 }, { "epoch": 1.73, "learning_rate": 8.068691374803514e-06, "loss": 0.4402, "step": 9324 }, { "epoch": 1.73, "learning_rate": 8.066731567266586e-06, "loss": 0.4377, "step": 9325 }, { "epoch": 1.73, "learning_rate": 8.064771836863483e-06, "loss": 0.4152, "step": 9326 }, { "epoch": 1.73, "learning_rate": 8.062812183672408e-06, "loss": 0.4346, "step": 9327 }, { "epoch": 1.73, "learning_rate": 8.060852607771533e-06, "loss": 0.4403, "step": 9328 }, { "epoch": 1.73, "learning_rate": 8.058893109239055e-06, "loss": 0.4236, "step": 9329 }, { "epoch": 1.73, "learning_rate": 8.056933688153149e-06, "loss": 0.4382, "step": 9330 }, { "epoch": 1.73, "learning_rate": 8.054974344591984e-06, "loss": 0.4237, "step": 9331 }, { "epoch": 1.73, "learning_rate": 8.053015078633748e-06, "loss": 0.4346, "step": 9332 }, { "epoch": 1.73, "learning_rate": 8.0510558903566e-06, "loss": 0.4188, "step": 9333 }, { "epoch": 1.73, "learning_rate": 8.04909677983872e-06, "loss": 0.4247, "step": 9334 }, { "epoch": 1.73, "learning_rate": 8.047137747158263e-06, "loss": 0.4277, "step": 9335 }, { "epoch": 1.73, "learning_rate": 8.045178792393393e-06, "loss": 0.4179, "step": 9336 }, { "epoch": 1.73, "learning_rate": 8.043219915622273e-06, "loss": 0.428, "step": 9337 }, { "epoch": 1.73, "learning_rate": 8.041261116923051e-06, "loss": 0.4363, "step": 9338 }, { "epoch": 1.73, "learning_rate": 8.039302396373889e-06, "loss": 0.4248, "step": 9339 }, { "epoch": 1.73, "learning_rate": 8.03734375405293e-06, "loss": 0.4215, "step": 9340 }, { "epoch": 1.73, "learning_rate": 8.03538519003832e-06, "loss": 0.4151, "step": 9341 }, { "epoch": 1.73, "learning_rate": 8.033426704408204e-06, "loss": 0.4263, "step": 9342 }, { "epoch": 1.73, "learning_rate": 8.03146829724072e-06, "loss": 0.4358, "step": 9343 }, { "epoch": 1.73, "learning_rate": 8.02950996861401e-06, "loss": 0.4406, "step": 9344 }, { "epoch": 1.73, "learning_rate": 8.027551718606202e-06, "loss": 0.4262, "step": 9345 }, { "epoch": 1.73, "learning_rate": 8.025593547295427e-06, "loss": 0.4255, "step": 9346 }, { "epoch": 1.73, "learning_rate": 8.023635454759815e-06, "loss": 0.4415, "step": 9347 }, { "epoch": 1.73, "learning_rate": 8.02167744107749e-06, "loss": 0.4241, "step": 9348 }, { "epoch": 1.73, "learning_rate": 8.019719506326571e-06, "loss": 0.436, "step": 9349 }, { "epoch": 1.73, "learning_rate": 8.017761650585178e-06, "loss": 0.4452, "step": 9350 }, { "epoch": 1.73, "learning_rate": 8.015803873931424e-06, "loss": 0.4159, "step": 9351 }, { "epoch": 1.73, "learning_rate": 8.013846176443426e-06, "loss": 0.4157, "step": 9352 }, { "epoch": 1.73, "learning_rate": 8.011888558199284e-06, "loss": 0.4388, "step": 9353 }, { "epoch": 1.73, "learning_rate": 8.00993101927711e-06, "loss": 0.4255, "step": 9354 }, { "epoch": 1.73, "learning_rate": 8.007973559755e-06, "loss": 0.4225, "step": 9355 }, { "epoch": 1.73, "learning_rate": 8.006016179711062e-06, "loss": 0.4352, "step": 9356 }, { "epoch": 1.73, "learning_rate": 8.004058879223386e-06, "loss": 0.4291, "step": 9357 }, { "epoch": 1.73, "learning_rate": 8.00210165837006e-06, "loss": 0.4397, "step": 9358 }, { "epoch": 1.73, "learning_rate": 8.000144517229185e-06, "loss": 0.4234, "step": 9359 }, { "epoch": 1.73, "learning_rate": 7.998187455878836e-06, "loss": 0.4378, "step": 9360 }, { "epoch": 1.73, "learning_rate": 7.996230474397106e-06, "loss": 0.4451, "step": 9361 }, { "epoch": 1.73, "learning_rate": 7.99427357286207e-06, "loss": 0.4418, "step": 9362 }, { "epoch": 1.73, "learning_rate": 7.9923167513518e-06, "loss": 0.4354, "step": 9363 }, { "epoch": 1.73, "learning_rate": 7.99036000994438e-06, "loss": 0.4175, "step": 9364 }, { "epoch": 1.73, "learning_rate": 7.98840334871787e-06, "loss": 0.438, "step": 9365 }, { "epoch": 1.73, "learning_rate": 7.986446767750346e-06, "loss": 0.4409, "step": 9366 }, { "epoch": 1.73, "learning_rate": 7.984490267119867e-06, "loss": 0.4315, "step": 9367 }, { "epoch": 1.73, "learning_rate": 7.982533846904494e-06, "loss": 0.4053, "step": 9368 }, { "epoch": 1.73, "learning_rate": 7.980577507182285e-06, "loss": 0.4145, "step": 9369 }, { "epoch": 1.73, "learning_rate": 7.978621248031294e-06, "loss": 0.4325, "step": 9370 }, { "epoch": 1.73, "learning_rate": 7.976665069529574e-06, "loss": 0.402, "step": 9371 }, { "epoch": 1.73, "learning_rate": 7.97470897175517e-06, "loss": 0.4384, "step": 9372 }, { "epoch": 1.73, "learning_rate": 7.972752954786129e-06, "loss": 0.4251, "step": 9373 }, { "epoch": 1.73, "learning_rate": 7.970797018700495e-06, "loss": 0.418, "step": 9374 }, { "epoch": 1.73, "learning_rate": 7.968841163576297e-06, "loss": 0.4289, "step": 9375 }, { "epoch": 1.73, "learning_rate": 7.96688538949158e-06, "loss": 0.4195, "step": 9376 }, { "epoch": 1.73, "learning_rate": 7.964929696524371e-06, "loss": 0.4288, "step": 9377 }, { "epoch": 1.74, "learning_rate": 7.9629740847527e-06, "loss": 0.4473, "step": 9378 }, { "epoch": 1.74, "learning_rate": 7.961018554254593e-06, "loss": 0.4322, "step": 9379 }, { "epoch": 1.74, "learning_rate": 7.959063105108066e-06, "loss": 0.4078, "step": 9380 }, { "epoch": 1.74, "learning_rate": 7.957107737391147e-06, "loss": 0.4429, "step": 9381 }, { "epoch": 1.74, "learning_rate": 7.955152451181842e-06, "loss": 0.4081, "step": 9382 }, { "epoch": 1.74, "learning_rate": 7.953197246558173e-06, "loss": 0.4487, "step": 9383 }, { "epoch": 1.74, "learning_rate": 7.951242123598144e-06, "loss": 0.4295, "step": 9384 }, { "epoch": 1.74, "learning_rate": 7.949287082379758e-06, "loss": 0.4305, "step": 9385 }, { "epoch": 1.74, "learning_rate": 7.947332122981024e-06, "loss": 0.4239, "step": 9386 }, { "epoch": 1.74, "learning_rate": 7.945377245479932e-06, "loss": 0.4095, "step": 9387 }, { "epoch": 1.74, "learning_rate": 7.94342244995449e-06, "loss": 0.4205, "step": 9388 }, { "epoch": 1.74, "learning_rate": 7.941467736482686e-06, "loss": 0.406, "step": 9389 }, { "epoch": 1.74, "learning_rate": 7.939513105142501e-06, "loss": 0.4334, "step": 9390 }, { "epoch": 1.74, "learning_rate": 7.937558556011934e-06, "loss": 0.441, "step": 9391 }, { "epoch": 1.74, "learning_rate": 7.935604089168957e-06, "loss": 0.4394, "step": 9392 }, { "epoch": 1.74, "learning_rate": 7.93364970469156e-06, "loss": 0.4399, "step": 9393 }, { "epoch": 1.74, "learning_rate": 7.931695402657708e-06, "loss": 0.4362, "step": 9394 }, { "epoch": 1.74, "learning_rate": 7.929741183145386e-06, "loss": 0.4294, "step": 9395 }, { "epoch": 1.74, "learning_rate": 7.927787046232556e-06, "loss": 0.4193, "step": 9396 }, { "epoch": 1.74, "learning_rate": 7.925832991997185e-06, "loss": 0.4154, "step": 9397 }, { "epoch": 1.74, "learning_rate": 7.923879020517238e-06, "loss": 0.4144, "step": 9398 }, { "epoch": 1.74, "learning_rate": 7.921925131870673e-06, "loss": 0.4124, "step": 9399 }, { "epoch": 1.74, "learning_rate": 7.91997132613545e-06, "loss": 0.4336, "step": 9400 }, { "epoch": 1.74, "learning_rate": 7.91801760338952e-06, "loss": 0.4289, "step": 9401 }, { "epoch": 1.74, "learning_rate": 7.91606396371083e-06, "loss": 0.4245, "step": 9402 }, { "epoch": 1.74, "learning_rate": 7.914110407177335e-06, "loss": 0.4241, "step": 9403 }, { "epoch": 1.74, "learning_rate": 7.912156933866965e-06, "loss": 0.4266, "step": 9404 }, { "epoch": 1.74, "learning_rate": 7.910203543857676e-06, "loss": 0.4271, "step": 9405 }, { "epoch": 1.74, "learning_rate": 7.908250237227394e-06, "loss": 0.4198, "step": 9406 }, { "epoch": 1.74, "learning_rate": 7.906297014054051e-06, "loss": 0.4221, "step": 9407 }, { "epoch": 1.74, "learning_rate": 7.904343874415585e-06, "loss": 0.426, "step": 9408 }, { "epoch": 1.74, "learning_rate": 7.902390818389915e-06, "loss": 0.422, "step": 9409 }, { "epoch": 1.74, "learning_rate": 7.90043784605497e-06, "loss": 0.4285, "step": 9410 }, { "epoch": 1.74, "learning_rate": 7.89848495748867e-06, "loss": 0.4226, "step": 9411 }, { "epoch": 1.74, "learning_rate": 7.896532152768923e-06, "loss": 0.4213, "step": 9412 }, { "epoch": 1.74, "learning_rate": 7.894579431973655e-06, "loss": 0.4252, "step": 9413 }, { "epoch": 1.74, "learning_rate": 7.892626795180764e-06, "loss": 0.4306, "step": 9414 }, { "epoch": 1.74, "learning_rate": 7.890674242468166e-06, "loss": 0.4322, "step": 9415 }, { "epoch": 1.74, "learning_rate": 7.888721773913757e-06, "loss": 0.4334, "step": 9416 }, { "epoch": 1.74, "learning_rate": 7.886769389595444e-06, "loss": 0.4332, "step": 9417 }, { "epoch": 1.74, "learning_rate": 7.884817089591121e-06, "loss": 0.4078, "step": 9418 }, { "epoch": 1.74, "learning_rate": 7.882864873978675e-06, "loss": 0.4228, "step": 9419 }, { "epoch": 1.74, "learning_rate": 7.880912742836005e-06, "loss": 0.4299, "step": 9420 }, { "epoch": 1.74, "learning_rate": 7.878960696240989e-06, "loss": 0.4296, "step": 9421 }, { "epoch": 1.74, "learning_rate": 7.877008734271518e-06, "loss": 0.4435, "step": 9422 }, { "epoch": 1.74, "learning_rate": 7.875056857005466e-06, "loss": 0.4228, "step": 9423 }, { "epoch": 1.74, "learning_rate": 7.873105064520712e-06, "loss": 0.4316, "step": 9424 }, { "epoch": 1.74, "learning_rate": 7.871153356895127e-06, "loss": 0.4269, "step": 9425 }, { "epoch": 1.74, "learning_rate": 7.869201734206582e-06, "loss": 0.4135, "step": 9426 }, { "epoch": 1.74, "learning_rate": 7.867250196532943e-06, "loss": 0.4313, "step": 9427 }, { "epoch": 1.74, "learning_rate": 7.865298743952074e-06, "loss": 0.4528, "step": 9428 }, { "epoch": 1.74, "learning_rate": 7.863347376541827e-06, "loss": 0.4238, "step": 9429 }, { "epoch": 1.74, "learning_rate": 7.861396094380072e-06, "loss": 0.4339, "step": 9430 }, { "epoch": 1.74, "learning_rate": 7.859444897544646e-06, "loss": 0.4291, "step": 9431 }, { "epoch": 1.75, "learning_rate": 7.85749378611341e-06, "loss": 0.444, "step": 9432 }, { "epoch": 1.75, "learning_rate": 7.855542760164207e-06, "loss": 0.424, "step": 9433 }, { "epoch": 1.75, "learning_rate": 7.853591819774872e-06, "loss": 0.421, "step": 9434 }, { "epoch": 1.75, "learning_rate": 7.851640965023253e-06, "loss": 0.4137, "step": 9435 }, { "epoch": 1.75, "learning_rate": 7.84969019598718e-06, "loss": 0.4067, "step": 9436 }, { "epoch": 1.75, "learning_rate": 7.847739512744489e-06, "loss": 0.4202, "step": 9437 }, { "epoch": 1.75, "learning_rate": 7.845788915373003e-06, "loss": 0.4335, "step": 9438 }, { "epoch": 1.75, "learning_rate": 7.843838403950555e-06, "loss": 0.426, "step": 9439 }, { "epoch": 1.75, "learning_rate": 7.841887978554963e-06, "loss": 0.418, "step": 9440 }, { "epoch": 1.75, "learning_rate": 7.83993763926404e-06, "loss": 0.4329, "step": 9441 }, { "epoch": 1.75, "learning_rate": 7.837987386155612e-06, "loss": 0.4257, "step": 9442 }, { "epoch": 1.75, "learning_rate": 7.83603721930748e-06, "loss": 0.4387, "step": 9443 }, { "epoch": 1.75, "learning_rate": 7.834087138797458e-06, "loss": 0.4473, "step": 9444 }, { "epoch": 1.75, "learning_rate": 7.832137144703348e-06, "loss": 0.4323, "step": 9445 }, { "epoch": 1.75, "learning_rate": 7.830187237102953e-06, "loss": 0.4134, "step": 9446 }, { "epoch": 1.75, "learning_rate": 7.82823741607407e-06, "loss": 0.4371, "step": 9447 }, { "epoch": 1.75, "learning_rate": 7.826287681694494e-06, "loss": 0.4014, "step": 9448 }, { "epoch": 1.75, "learning_rate": 7.824338034042013e-06, "loss": 0.4212, "step": 9449 }, { "epoch": 1.75, "learning_rate": 7.82238847319442e-06, "loss": 0.4144, "step": 9450 }, { "epoch": 1.75, "learning_rate": 7.82043899922949e-06, "loss": 0.4396, "step": 9451 }, { "epoch": 1.75, "learning_rate": 7.818489612225012e-06, "loss": 0.4091, "step": 9452 }, { "epoch": 1.75, "learning_rate": 7.816540312258759e-06, "loss": 0.4337, "step": 9453 }, { "epoch": 1.75, "learning_rate": 7.814591099408507e-06, "loss": 0.4349, "step": 9454 }, { "epoch": 1.75, "learning_rate": 7.812641973752021e-06, "loss": 0.456, "step": 9455 }, { "epoch": 1.75, "learning_rate": 7.81069293536707e-06, "loss": 0.4491, "step": 9456 }, { "epoch": 1.75, "learning_rate": 7.808743984331421e-06, "loss": 0.435, "step": 9457 }, { "epoch": 1.75, "learning_rate": 7.806795120722826e-06, "loss": 0.419, "step": 9458 }, { "epoch": 1.75, "learning_rate": 7.804846344619049e-06, "loss": 0.4427, "step": 9459 }, { "epoch": 1.75, "learning_rate": 7.802897656097833e-06, "loss": 0.4067, "step": 9460 }, { "epoch": 1.75, "learning_rate": 7.800949055236937e-06, "loss": 0.4405, "step": 9461 }, { "epoch": 1.75, "learning_rate": 7.799000542114103e-06, "loss": 0.43, "step": 9462 }, { "epoch": 1.75, "learning_rate": 7.797052116807069e-06, "loss": 0.4394, "step": 9463 }, { "epoch": 1.75, "learning_rate": 7.795103779393581e-06, "loss": 0.4154, "step": 9464 }, { "epoch": 1.75, "learning_rate": 7.793155529951365e-06, "loss": 0.4272, "step": 9465 }, { "epoch": 1.75, "learning_rate": 7.791207368558162e-06, "loss": 0.4123, "step": 9466 }, { "epoch": 1.75, "learning_rate": 7.789259295291696e-06, "loss": 0.4535, "step": 9467 }, { "epoch": 1.75, "learning_rate": 7.787311310229685e-06, "loss": 0.4243, "step": 9468 }, { "epoch": 1.75, "learning_rate": 7.785363413449862e-06, "loss": 0.4352, "step": 9469 }, { "epoch": 1.75, "learning_rate": 7.783415605029934e-06, "loss": 0.4263, "step": 9470 }, { "epoch": 1.75, "learning_rate": 7.781467885047623e-06, "loss": 0.4239, "step": 9471 }, { "epoch": 1.75, "learning_rate": 7.779520253580635e-06, "loss": 0.4342, "step": 9472 }, { "epoch": 1.75, "learning_rate": 7.777572710706677e-06, "loss": 0.4181, "step": 9473 }, { "epoch": 1.75, "learning_rate": 7.775625256503453e-06, "loss": 0.4342, "step": 9474 }, { "epoch": 1.75, "learning_rate": 7.773677891048664e-06, "loss": 0.4054, "step": 9475 }, { "epoch": 1.75, "learning_rate": 7.771730614420003e-06, "loss": 0.414, "step": 9476 }, { "epoch": 1.75, "learning_rate": 7.76978342669517e-06, "loss": 0.408, "step": 9477 }, { "epoch": 1.75, "learning_rate": 7.767836327951842e-06, "loss": 0.4399, "step": 9478 }, { "epoch": 1.75, "learning_rate": 7.765889318267718e-06, "loss": 0.4379, "step": 9479 }, { "epoch": 1.75, "learning_rate": 7.763942397720468e-06, "loss": 0.4327, "step": 9480 }, { "epoch": 1.75, "learning_rate": 7.761995566387782e-06, "loss": 0.4301, "step": 9481 }, { "epoch": 1.75, "learning_rate": 7.760048824347324e-06, "loss": 0.4312, "step": 9482 }, { "epoch": 1.75, "learning_rate": 7.758102171676775e-06, "loss": 0.4054, "step": 9483 }, { "epoch": 1.75, "learning_rate": 7.7561556084538e-06, "loss": 0.4291, "step": 9484 }, { "epoch": 1.75, "learning_rate": 7.754209134756056e-06, "loss": 0.401, "step": 9485 }, { "epoch": 1.76, "learning_rate": 7.752262750661216e-06, "loss": 0.4172, "step": 9486 }, { "epoch": 1.76, "learning_rate": 7.750316456246924e-06, "loss": 0.4279, "step": 9487 }, { "epoch": 1.76, "learning_rate": 7.748370251590847e-06, "loss": 0.4365, "step": 9488 }, { "epoch": 1.76, "learning_rate": 7.746424136770627e-06, "loss": 0.4204, "step": 9489 }, { "epoch": 1.76, "learning_rate": 7.744478111863908e-06, "loss": 0.4401, "step": 9490 }, { "epoch": 1.76, "learning_rate": 7.742532176948339e-06, "loss": 0.422, "step": 9491 }, { "epoch": 1.76, "learning_rate": 7.740586332101552e-06, "loss": 0.4294, "step": 9492 }, { "epoch": 1.76, "learning_rate": 7.738640577401191e-06, "loss": 0.425, "step": 9493 }, { "epoch": 1.76, "learning_rate": 7.736694912924884e-06, "loss": 0.4129, "step": 9494 }, { "epoch": 1.76, "learning_rate": 7.73474933875026e-06, "loss": 0.4156, "step": 9495 }, { "epoch": 1.76, "learning_rate": 7.732803854954943e-06, "loss": 0.4146, "step": 9496 }, { "epoch": 1.76, "learning_rate": 7.730858461616554e-06, "loss": 0.4269, "step": 9497 }, { "epoch": 1.76, "learning_rate": 7.72891315881271e-06, "loss": 0.4246, "step": 9498 }, { "epoch": 1.76, "learning_rate": 7.726967946621029e-06, "loss": 0.433, "step": 9499 }, { "epoch": 1.76, "learning_rate": 7.725022825119116e-06, "loss": 0.4135, "step": 9500 }, { "epoch": 1.76, "learning_rate": 7.723077794384582e-06, "loss": 0.4168, "step": 9501 }, { "epoch": 1.76, "learning_rate": 7.721132854495025e-06, "loss": 0.4324, "step": 9502 }, { "epoch": 1.76, "learning_rate": 7.719188005528053e-06, "loss": 0.4115, "step": 9503 }, { "epoch": 1.76, "learning_rate": 7.717243247561253e-06, "loss": 0.4192, "step": 9504 }, { "epoch": 1.76, "learning_rate": 7.715298580672224e-06, "loss": 0.4494, "step": 9505 }, { "epoch": 1.76, "learning_rate": 7.713354004938552e-06, "loss": 0.4223, "step": 9506 }, { "epoch": 1.76, "learning_rate": 7.711409520437815e-06, "loss": 0.4254, "step": 9507 }, { "epoch": 1.76, "learning_rate": 7.709465127247609e-06, "loss": 0.4269, "step": 9508 }, { "epoch": 1.76, "learning_rate": 7.707520825445498e-06, "loss": 0.4304, "step": 9509 }, { "epoch": 1.76, "learning_rate": 7.705576615109066e-06, "loss": 0.4575, "step": 9510 }, { "epoch": 1.76, "learning_rate": 7.703632496315878e-06, "loss": 0.4093, "step": 9511 }, { "epoch": 1.76, "learning_rate": 7.701688469143497e-06, "loss": 0.4099, "step": 9512 }, { "epoch": 1.76, "learning_rate": 7.699744533669497e-06, "loss": 0.4286, "step": 9513 }, { "epoch": 1.76, "learning_rate": 7.697800689971427e-06, "loss": 0.4172, "step": 9514 }, { "epoch": 1.76, "learning_rate": 7.69585693812685e-06, "loss": 0.4107, "step": 9515 }, { "epoch": 1.76, "learning_rate": 7.693913278213316e-06, "loss": 0.4477, "step": 9516 }, { "epoch": 1.76, "learning_rate": 7.691969710308367e-06, "loss": 0.4254, "step": 9517 }, { "epoch": 1.76, "learning_rate": 7.69002623448956e-06, "loss": 0.4096, "step": 9518 }, { "epoch": 1.76, "learning_rate": 7.688082850834424e-06, "loss": 0.4303, "step": 9519 }, { "epoch": 1.76, "learning_rate": 7.686139559420507e-06, "loss": 0.4233, "step": 9520 }, { "epoch": 1.76, "learning_rate": 7.684196360325333e-06, "loss": 0.4207, "step": 9521 }, { "epoch": 1.76, "learning_rate": 7.68225325362644e-06, "loss": 0.4641, "step": 9522 }, { "epoch": 1.76, "learning_rate": 7.680310239401349e-06, "loss": 0.4486, "step": 9523 }, { "epoch": 1.76, "learning_rate": 7.678367317727583e-06, "loss": 0.436, "step": 9524 }, { "epoch": 1.76, "learning_rate": 7.676424488682666e-06, "loss": 0.4203, "step": 9525 }, { "epoch": 1.76, "learning_rate": 7.674481752344107e-06, "loss": 0.4186, "step": 9526 }, { "epoch": 1.76, "learning_rate": 7.672539108789423e-06, "loss": 0.4279, "step": 9527 }, { "epoch": 1.76, "learning_rate": 7.670596558096119e-06, "loss": 0.4362, "step": 9528 }, { "epoch": 1.76, "learning_rate": 7.668654100341697e-06, "loss": 0.4299, "step": 9529 }, { "epoch": 1.76, "learning_rate": 7.666711735603665e-06, "loss": 0.4174, "step": 9530 }, { "epoch": 1.76, "learning_rate": 7.66476946395951e-06, "loss": 0.409, "step": 9531 }, { "epoch": 1.76, "learning_rate": 7.662827285486732e-06, "loss": 0.4379, "step": 9532 }, { "epoch": 1.76, "learning_rate": 7.66088520026282e-06, "loss": 0.4336, "step": 9533 }, { "epoch": 1.76, "learning_rate": 7.658943208365253e-06, "loss": 0.4319, "step": 9534 }, { "epoch": 1.76, "learning_rate": 7.657001309871524e-06, "loss": 0.4476, "step": 9535 }, { "epoch": 1.76, "learning_rate": 7.655059504859097e-06, "loss": 0.3987, "step": 9536 }, { "epoch": 1.76, "learning_rate": 7.65311779340546e-06, "loss": 0.4097, "step": 9537 }, { "epoch": 1.76, "learning_rate": 7.651176175588078e-06, "loss": 0.44, "step": 9538 }, { "epoch": 1.76, "learning_rate": 7.649234651484415e-06, "loss": 0.4245, "step": 9539 }, { "epoch": 1.77, "learning_rate": 7.647293221171939e-06, "loss": 0.4157, "step": 9540 }, { "epoch": 1.77, "learning_rate": 7.645351884728104e-06, "loss": 0.4101, "step": 9541 }, { "epoch": 1.77, "learning_rate": 7.643410642230375e-06, "loss": 0.4258, "step": 9542 }, { "epoch": 1.77, "learning_rate": 7.641469493756196e-06, "loss": 0.4407, "step": 9543 }, { "epoch": 1.77, "learning_rate": 7.639528439383015e-06, "loss": 0.4461, "step": 9544 }, { "epoch": 1.77, "learning_rate": 7.637587479188282e-06, "loss": 0.4198, "step": 9545 }, { "epoch": 1.77, "learning_rate": 7.63564661324943e-06, "loss": 0.4406, "step": 9546 }, { "epoch": 1.77, "learning_rate": 7.633705841643907e-06, "loss": 0.4369, "step": 9547 }, { "epoch": 1.77, "learning_rate": 7.631765164449134e-06, "loss": 0.423, "step": 9548 }, { "epoch": 1.77, "learning_rate": 7.629824581742552e-06, "loss": 0.4245, "step": 9549 }, { "epoch": 1.77, "learning_rate": 7.627884093601577e-06, "loss": 0.4159, "step": 9550 }, { "epoch": 1.77, "learning_rate": 7.625943700103635e-06, "loss": 0.4417, "step": 9551 }, { "epoch": 1.77, "learning_rate": 7.624003401326145e-06, "loss": 0.4153, "step": 9552 }, { "epoch": 1.77, "learning_rate": 7.6220631973465174e-06, "loss": 0.4464, "step": 9553 }, { "epoch": 1.77, "learning_rate": 7.620123088242171e-06, "loss": 0.4256, "step": 9554 }, { "epoch": 1.77, "learning_rate": 7.618183074090506e-06, "loss": 0.4332, "step": 9555 }, { "epoch": 1.77, "learning_rate": 7.616243154968922e-06, "loss": 0.4343, "step": 9556 }, { "epoch": 1.77, "learning_rate": 7.614303330954827e-06, "loss": 0.4189, "step": 9557 }, { "epoch": 1.77, "learning_rate": 7.612363602125608e-06, "loss": 0.4114, "step": 9558 }, { "epoch": 1.77, "learning_rate": 7.610423968558667e-06, "loss": 0.4086, "step": 9559 }, { "epoch": 1.77, "learning_rate": 7.6084844303313836e-06, "loss": 0.4483, "step": 9560 }, { "epoch": 1.77, "learning_rate": 7.6065449875211385e-06, "loss": 0.427, "step": 9561 }, { "epoch": 1.77, "learning_rate": 7.604605640205323e-06, "loss": 0.406, "step": 9562 }, { "epoch": 1.77, "learning_rate": 7.6026663884613015e-06, "loss": 0.4121, "step": 9563 }, { "epoch": 1.77, "learning_rate": 7.600727232366458e-06, "loss": 0.4425, "step": 9564 }, { "epoch": 1.77, "learning_rate": 7.598788171998156e-06, "loss": 0.4282, "step": 9565 }, { "epoch": 1.77, "learning_rate": 7.596849207433756e-06, "loss": 0.4273, "step": 9566 }, { "epoch": 1.77, "learning_rate": 7.594910338750627e-06, "loss": 0.433, "step": 9567 }, { "epoch": 1.77, "learning_rate": 7.592971566026119e-06, "loss": 0.4087, "step": 9568 }, { "epoch": 1.77, "learning_rate": 7.591032889337593e-06, "loss": 0.4366, "step": 9569 }, { "epoch": 1.77, "learning_rate": 7.589094308762389e-06, "loss": 0.4172, "step": 9570 }, { "epoch": 1.77, "learning_rate": 7.587155824377865e-06, "loss": 0.424, "step": 9571 }, { "epoch": 1.77, "learning_rate": 7.585217436261352e-06, "loss": 0.4327, "step": 9572 }, { "epoch": 1.77, "learning_rate": 7.5832791444901945e-06, "loss": 0.417, "step": 9573 }, { "epoch": 1.77, "learning_rate": 7.581340949141723e-06, "loss": 0.4382, "step": 9574 }, { "epoch": 1.77, "learning_rate": 7.5794028502932705e-06, "loss": 0.4296, "step": 9575 }, { "epoch": 1.77, "learning_rate": 7.577464848022162e-06, "loss": 0.4367, "step": 9576 }, { "epoch": 1.77, "learning_rate": 7.575526942405724e-06, "loss": 0.4283, "step": 9577 }, { "epoch": 1.77, "learning_rate": 7.573589133521267e-06, "loss": 0.4062, "step": 9578 }, { "epoch": 1.77, "learning_rate": 7.571651421446116e-06, "loss": 0.4256, "step": 9579 }, { "epoch": 1.77, "learning_rate": 7.569713806257573e-06, "loss": 0.4258, "step": 9580 }, { "epoch": 1.77, "learning_rate": 7.567776288032953e-06, "loss": 0.4128, "step": 9581 }, { "epoch": 1.77, "learning_rate": 7.565838866849558e-06, "loss": 0.4408, "step": 9582 }, { "epoch": 1.77, "learning_rate": 7.56390154278468e-06, "loss": 0.4327, "step": 9583 }, { "epoch": 1.77, "learning_rate": 7.561964315915623e-06, "loss": 0.4056, "step": 9584 }, { "epoch": 1.77, "learning_rate": 7.5600271863196725e-06, "loss": 0.4458, "step": 9585 }, { "epoch": 1.77, "learning_rate": 7.558090154074125e-06, "loss": 0.4095, "step": 9586 }, { "epoch": 1.77, "learning_rate": 7.556153219256259e-06, "loss": 0.4134, "step": 9587 }, { "epoch": 1.77, "learning_rate": 7.55421638194335e-06, "loss": 0.4203, "step": 9588 }, { "epoch": 1.77, "learning_rate": 7.552279642212684e-06, "loss": 0.4364, "step": 9589 }, { "epoch": 1.77, "learning_rate": 7.5503430001415245e-06, "loss": 0.4073, "step": 9590 }, { "epoch": 1.77, "learning_rate": 7.548406455807147e-06, "loss": 0.4369, "step": 9591 }, { "epoch": 1.77, "learning_rate": 7.546470009286809e-06, "loss": 0.4391, "step": 9592 }, { "epoch": 1.77, "learning_rate": 7.5445336606577804e-06, "loss": 0.4294, "step": 9593 }, { "epoch": 1.78, "learning_rate": 7.542597409997311e-06, "loss": 0.4339, "step": 9594 }, { "epoch": 1.78, "learning_rate": 7.540661257382651e-06, "loss": 0.414, "step": 9595 }, { "epoch": 1.78, "learning_rate": 7.538725202891058e-06, "loss": 0.4183, "step": 9596 }, { "epoch": 1.78, "learning_rate": 7.536789246599769e-06, "loss": 0.4295, "step": 9597 }, { "epoch": 1.78, "learning_rate": 7.534853388586033e-06, "loss": 0.4414, "step": 9598 }, { "epoch": 1.78, "learning_rate": 7.5329176289270804e-06, "loss": 0.4157, "step": 9599 }, { "epoch": 1.78, "learning_rate": 7.530981967700146e-06, "loss": 0.4232, "step": 9600 }, { "epoch": 1.78, "learning_rate": 7.5290464049824596e-06, "loss": 0.4191, "step": 9601 }, { "epoch": 1.78, "learning_rate": 7.5271109408512476e-06, "loss": 0.4064, "step": 9602 }, { "epoch": 1.78, "learning_rate": 7.52517557538373e-06, "loss": 0.4289, "step": 9603 }, { "epoch": 1.78, "learning_rate": 7.523240308657127e-06, "loss": 0.4301, "step": 9604 }, { "epoch": 1.78, "learning_rate": 7.5213051407486474e-06, "loss": 0.4106, "step": 9605 }, { "epoch": 1.78, "learning_rate": 7.519370071735506e-06, "loss": 0.4439, "step": 9606 }, { "epoch": 1.78, "learning_rate": 7.517435101694902e-06, "loss": 0.4556, "step": 9607 }, { "epoch": 1.78, "learning_rate": 7.515500230704045e-06, "loss": 0.4324, "step": 9608 }, { "epoch": 1.78, "learning_rate": 7.51356545884013e-06, "loss": 0.4052, "step": 9609 }, { "epoch": 1.78, "learning_rate": 7.511630786180345e-06, "loss": 0.4411, "step": 9610 }, { "epoch": 1.78, "learning_rate": 7.509696212801889e-06, "loss": 0.4375, "step": 9611 }, { "epoch": 1.78, "learning_rate": 7.507761738781938e-06, "loss": 0.4091, "step": 9612 }, { "epoch": 1.78, "learning_rate": 7.505827364197684e-06, "loss": 0.4427, "step": 9613 }, { "epoch": 1.78, "learning_rate": 7.503893089126297e-06, "loss": 0.4338, "step": 9614 }, { "epoch": 1.78, "learning_rate": 7.501958913644959e-06, "loss": 0.4184, "step": 9615 }, { "epoch": 1.78, "learning_rate": 7.500024837830834e-06, "loss": 0.4127, "step": 9616 }, { "epoch": 1.78, "learning_rate": 7.498090861761086e-06, "loss": 0.4373, "step": 9617 }, { "epoch": 1.78, "learning_rate": 7.496156985512883e-06, "loss": 0.4353, "step": 9618 }, { "epoch": 1.78, "learning_rate": 7.494223209163378e-06, "loss": 0.4308, "step": 9619 }, { "epoch": 1.78, "learning_rate": 7.492289532789732e-06, "loss": 0.4314, "step": 9620 }, { "epoch": 1.78, "learning_rate": 7.490355956469089e-06, "loss": 0.4273, "step": 9621 }, { "epoch": 1.78, "learning_rate": 7.4884224802785955e-06, "loss": 0.4308, "step": 9622 }, { "epoch": 1.78, "learning_rate": 7.486489104295396e-06, "loss": 0.418, "step": 9623 }, { "epoch": 1.78, "learning_rate": 7.484555828596627e-06, "loss": 0.4283, "step": 9624 }, { "epoch": 1.78, "learning_rate": 7.4826226532594225e-06, "loss": 0.4307, "step": 9625 }, { "epoch": 1.78, "learning_rate": 7.480689578360916e-06, "loss": 0.4241, "step": 9626 }, { "epoch": 1.78, "learning_rate": 7.478756603978228e-06, "loss": 0.4441, "step": 9627 }, { "epoch": 1.78, "learning_rate": 7.4768237301884865e-06, "loss": 0.4324, "step": 9628 }, { "epoch": 1.78, "learning_rate": 7.474890957068802e-06, "loss": 0.4452, "step": 9629 }, { "epoch": 1.78, "learning_rate": 7.472958284696298e-06, "loss": 0.4132, "step": 9630 }, { "epoch": 1.78, "learning_rate": 7.471025713148079e-06, "loss": 0.4288, "step": 9631 }, { "epoch": 1.78, "learning_rate": 7.469093242501249e-06, "loss": 0.4295, "step": 9632 }, { "epoch": 1.78, "learning_rate": 7.467160872832917e-06, "loss": 0.4389, "step": 9633 }, { "epoch": 1.78, "learning_rate": 7.465228604220172e-06, "loss": 0.4422, "step": 9634 }, { "epoch": 1.78, "learning_rate": 7.463296436740116e-06, "loss": 0.4229, "step": 9635 }, { "epoch": 1.78, "learning_rate": 7.461364370469833e-06, "loss": 0.4539, "step": 9636 }, { "epoch": 1.78, "learning_rate": 7.459432405486414e-06, "loss": 0.4083, "step": 9637 }, { "epoch": 1.78, "learning_rate": 7.4575005418669386e-06, "loss": 0.4178, "step": 9638 }, { "epoch": 1.78, "learning_rate": 7.455568779688481e-06, "loss": 0.4179, "step": 9639 }, { "epoch": 1.78, "learning_rate": 7.453637119028122e-06, "loss": 0.4298, "step": 9640 }, { "epoch": 1.78, "learning_rate": 7.451705559962923e-06, "loss": 0.4076, "step": 9641 }, { "epoch": 1.78, "learning_rate": 7.449774102569959e-06, "loss": 0.4343, "step": 9642 }, { "epoch": 1.78, "learning_rate": 7.447842746926286e-06, "loss": 0.4412, "step": 9643 }, { "epoch": 1.78, "learning_rate": 7.445911493108958e-06, "loss": 0.4306, "step": 9644 }, { "epoch": 1.78, "learning_rate": 7.443980341195037e-06, "loss": 0.4146, "step": 9645 }, { "epoch": 1.78, "learning_rate": 7.442049291261564e-06, "loss": 0.4162, "step": 9646 }, { "epoch": 1.78, "learning_rate": 7.4401183433855926e-06, "loss": 0.4328, "step": 9647 }, { "epoch": 1.79, "learning_rate": 7.4381874976441585e-06, "loss": 0.4326, "step": 9648 }, { "epoch": 1.79, "learning_rate": 7.436256754114299e-06, "loss": 0.4226, "step": 9649 }, { "epoch": 1.79, "learning_rate": 7.434326112873048e-06, "loss": 0.4368, "step": 9650 }, { "epoch": 1.79, "learning_rate": 7.432395573997435e-06, "loss": 0.439, "step": 9651 }, { "epoch": 1.79, "learning_rate": 7.430465137564487e-06, "loss": 0.4305, "step": 9652 }, { "epoch": 1.79, "learning_rate": 7.428534803651222e-06, "loss": 0.4272, "step": 9653 }, { "epoch": 1.79, "learning_rate": 7.4266045723346545e-06, "loss": 0.4381, "step": 9654 }, { "epoch": 1.79, "learning_rate": 7.424674443691804e-06, "loss": 0.4229, "step": 9655 }, { "epoch": 1.79, "learning_rate": 7.422744417799671e-06, "loss": 0.435, "step": 9656 }, { "epoch": 1.79, "learning_rate": 7.420814494735269e-06, "loss": 0.4261, "step": 9657 }, { "epoch": 1.79, "learning_rate": 7.418884674575588e-06, "loss": 0.4184, "step": 9658 }, { "epoch": 1.79, "learning_rate": 7.416954957397634e-06, "loss": 0.4355, "step": 9659 }, { "epoch": 1.79, "learning_rate": 7.415025343278395e-06, "loss": 0.4034, "step": 9660 }, { "epoch": 1.79, "learning_rate": 7.413095832294854e-06, "loss": 0.4274, "step": 9661 }, { "epoch": 1.79, "learning_rate": 7.4111664245240055e-06, "loss": 0.4471, "step": 9662 }, { "epoch": 1.79, "learning_rate": 7.4092371200428185e-06, "loss": 0.4158, "step": 9663 }, { "epoch": 1.79, "learning_rate": 7.407307918928278e-06, "loss": 0.426, "step": 9664 }, { "epoch": 1.79, "learning_rate": 7.405378821257352e-06, "loss": 0.4307, "step": 9665 }, { "epoch": 1.79, "learning_rate": 7.403449827107001e-06, "loss": 0.4158, "step": 9666 }, { "epoch": 1.79, "learning_rate": 7.401520936554201e-06, "loss": 0.3982, "step": 9667 }, { "epoch": 1.79, "learning_rate": 7.3995921496759e-06, "loss": 0.4244, "step": 9668 }, { "epoch": 1.79, "learning_rate": 7.397663466549061e-06, "loss": 0.4121, "step": 9669 }, { "epoch": 1.79, "learning_rate": 7.39573488725063e-06, "loss": 0.4301, "step": 9670 }, { "epoch": 1.79, "learning_rate": 7.393806411857555e-06, "loss": 0.4499, "step": 9671 }, { "epoch": 1.79, "learning_rate": 7.39187804044678e-06, "loss": 0.4163, "step": 9672 }, { "epoch": 1.79, "learning_rate": 7.389949773095241e-06, "loss": 0.4449, "step": 9673 }, { "epoch": 1.79, "learning_rate": 7.388021609879874e-06, "loss": 0.4356, "step": 9674 }, { "epoch": 1.79, "learning_rate": 7.386093550877611e-06, "loss": 0.419, "step": 9675 }, { "epoch": 1.79, "learning_rate": 7.384165596165371e-06, "loss": 0.4436, "step": 9676 }, { "epoch": 1.79, "learning_rate": 7.3822377458200865e-06, "loss": 0.4084, "step": 9677 }, { "epoch": 1.79, "learning_rate": 7.380309999918665e-06, "loss": 0.4473, "step": 9678 }, { "epoch": 1.79, "learning_rate": 7.378382358538028e-06, "loss": 0.4094, "step": 9679 }, { "epoch": 1.79, "learning_rate": 7.376454821755079e-06, "loss": 0.4246, "step": 9680 }, { "epoch": 1.79, "learning_rate": 7.374527389646724e-06, "loss": 0.4222, "step": 9681 }, { "epoch": 1.79, "learning_rate": 7.372600062289867e-06, "loss": 0.4391, "step": 9682 }, { "epoch": 1.79, "learning_rate": 7.370672839761401e-06, "loss": 0.4277, "step": 9683 }, { "epoch": 1.79, "learning_rate": 7.368745722138224e-06, "loss": 0.4223, "step": 9684 }, { "epoch": 1.79, "learning_rate": 7.366818709497216e-06, "loss": 0.4244, "step": 9685 }, { "epoch": 1.79, "learning_rate": 7.364891801915271e-06, "loss": 0.43, "step": 9686 }, { "epoch": 1.79, "learning_rate": 7.362964999469264e-06, "loss": 0.4324, "step": 9687 }, { "epoch": 1.79, "learning_rate": 7.361038302236068e-06, "loss": 0.4238, "step": 9688 }, { "epoch": 1.79, "learning_rate": 7.359111710292562e-06, "loss": 0.4333, "step": 9689 }, { "epoch": 1.79, "learning_rate": 7.357185223715604e-06, "loss": 0.4275, "step": 9690 }, { "epoch": 1.79, "learning_rate": 7.355258842582067e-06, "loss": 0.417, "step": 9691 }, { "epoch": 1.79, "learning_rate": 7.353332566968807e-06, "loss": 0.4351, "step": 9692 }, { "epoch": 1.79, "learning_rate": 7.351406396952672e-06, "loss": 0.4235, "step": 9693 }, { "epoch": 1.79, "learning_rate": 7.349480332610523e-06, "loss": 0.4299, "step": 9694 }, { "epoch": 1.79, "learning_rate": 7.347554374019196e-06, "loss": 0.4374, "step": 9695 }, { "epoch": 1.79, "learning_rate": 7.345628521255543e-06, "loss": 0.403, "step": 9696 }, { "epoch": 1.79, "learning_rate": 7.343702774396395e-06, "loss": 0.4246, "step": 9697 }, { "epoch": 1.79, "learning_rate": 7.3417771335185905e-06, "loss": 0.4081, "step": 9698 }, { "epoch": 1.79, "learning_rate": 7.339851598698955e-06, "loss": 0.451, "step": 9699 }, { "epoch": 1.79, "learning_rate": 7.337926170014315e-06, "loss": 0.431, "step": 9700 }, { "epoch": 1.79, "learning_rate": 7.336000847541494e-06, "loss": 0.4256, "step": 9701 }, { "epoch": 1.8, "learning_rate": 7.334075631357308e-06, "loss": 0.429, "step": 9702 }, { "epoch": 1.8, "learning_rate": 7.332150521538565e-06, "loss": 0.414, "step": 9703 }, { "epoch": 1.8, "learning_rate": 7.33022551816208e-06, "loss": 0.4135, "step": 9704 }, { "epoch": 1.8, "learning_rate": 7.32830062130465e-06, "loss": 0.4372, "step": 9705 }, { "epoch": 1.8, "learning_rate": 7.3263758310430834e-06, "loss": 0.4259, "step": 9706 }, { "epoch": 1.8, "learning_rate": 7.324451147454165e-06, "loss": 0.4204, "step": 9707 }, { "epoch": 1.8, "learning_rate": 7.322526570614699e-06, "loss": 0.4196, "step": 9708 }, { "epoch": 1.8, "learning_rate": 7.320602100601464e-06, "loss": 0.4214, "step": 9709 }, { "epoch": 1.8, "learning_rate": 7.318677737491241e-06, "loss": 0.4461, "step": 9710 }, { "epoch": 1.8, "learning_rate": 7.316753481360817e-06, "loss": 0.438, "step": 9711 }, { "epoch": 1.8, "learning_rate": 7.314829332286954e-06, "loss": 0.4574, "step": 9712 }, { "epoch": 1.8, "learning_rate": 7.312905290346436e-06, "loss": 0.4244, "step": 9713 }, { "epoch": 1.8, "learning_rate": 7.31098135561602e-06, "loss": 0.4388, "step": 9714 }, { "epoch": 1.8, "learning_rate": 7.309057528172467e-06, "loss": 0.4274, "step": 9715 }, { "epoch": 1.8, "learning_rate": 7.307133808092541e-06, "loss": 0.4324, "step": 9716 }, { "epoch": 1.8, "learning_rate": 7.3052101954529845e-06, "loss": 0.413, "step": 9717 }, { "epoch": 1.8, "learning_rate": 7.303286690330555e-06, "loss": 0.4259, "step": 9718 }, { "epoch": 1.8, "learning_rate": 7.301363292801997e-06, "loss": 0.4386, "step": 9719 }, { "epoch": 1.8, "learning_rate": 7.29944000294404e-06, "loss": 0.4188, "step": 9720 }, { "epoch": 1.8, "learning_rate": 7.2975168208334334e-06, "loss": 0.451, "step": 9721 }, { "epoch": 1.8, "learning_rate": 7.295593746546897e-06, "loss": 0.4275, "step": 9722 }, { "epoch": 1.8, "learning_rate": 7.293670780161167e-06, "loss": 0.4144, "step": 9723 }, { "epoch": 1.8, "learning_rate": 7.291747921752961e-06, "loss": 0.4329, "step": 9724 }, { "epoch": 1.8, "learning_rate": 7.289825171398999e-06, "loss": 0.4318, "step": 9725 }, { "epoch": 1.8, "learning_rate": 7.2879025291759934e-06, "loss": 0.4198, "step": 9726 }, { "epoch": 1.8, "learning_rate": 7.285979995160656e-06, "loss": 0.4244, "step": 9727 }, { "epoch": 1.8, "learning_rate": 7.284057569429692e-06, "loss": 0.4264, "step": 9728 }, { "epoch": 1.8, "learning_rate": 7.282135252059804e-06, "loss": 0.4453, "step": 9729 }, { "epoch": 1.8, "learning_rate": 7.2802130431276845e-06, "loss": 0.438, "step": 9730 }, { "epoch": 1.8, "learning_rate": 7.278290942710034e-06, "loss": 0.4311, "step": 9731 }, { "epoch": 1.8, "learning_rate": 7.27636895088353e-06, "loss": 0.4005, "step": 9732 }, { "epoch": 1.8, "learning_rate": 7.274447067724866e-06, "loss": 0.4431, "step": 9733 }, { "epoch": 1.8, "learning_rate": 7.272525293310715e-06, "loss": 0.4292, "step": 9734 }, { "epoch": 1.8, "learning_rate": 7.270603627717758e-06, "loss": 0.4154, "step": 9735 }, { "epoch": 1.8, "learning_rate": 7.2686820710226635e-06, "loss": 0.4244, "step": 9736 }, { "epoch": 1.8, "learning_rate": 7.266760623302094e-06, "loss": 0.4429, "step": 9737 }, { "epoch": 1.8, "learning_rate": 7.264839284632718e-06, "loss": 0.4307, "step": 9738 }, { "epoch": 1.8, "learning_rate": 7.262918055091186e-06, "loss": 0.432, "step": 9739 }, { "epoch": 1.8, "learning_rate": 7.260996934754162e-06, "loss": 0.4204, "step": 9740 }, { "epoch": 1.8, "learning_rate": 7.2590759236982886e-06, "loss": 0.4201, "step": 9741 }, { "epoch": 1.8, "learning_rate": 7.257155022000206e-06, "loss": 0.4296, "step": 9742 }, { "epoch": 1.8, "learning_rate": 7.2552342297365654e-06, "loss": 0.4245, "step": 9743 }, { "epoch": 1.8, "learning_rate": 7.253313546983991e-06, "loss": 0.428, "step": 9744 }, { "epoch": 1.8, "learning_rate": 7.251392973819127e-06, "loss": 0.4462, "step": 9745 }, { "epoch": 1.8, "learning_rate": 7.249472510318591e-06, "loss": 0.4232, "step": 9746 }, { "epoch": 1.8, "learning_rate": 7.24755215655901e-06, "loss": 0.4341, "step": 9747 }, { "epoch": 1.8, "learning_rate": 7.245631912617002e-06, "loss": 0.4032, "step": 9748 }, { "epoch": 1.8, "learning_rate": 7.2437117785691815e-06, "loss": 0.4422, "step": 9749 }, { "epoch": 1.8, "learning_rate": 7.241791754492157e-06, "loss": 0.4504, "step": 9750 }, { "epoch": 1.8, "learning_rate": 7.239871840462535e-06, "loss": 0.4253, "step": 9751 }, { "epoch": 1.8, "learning_rate": 7.237952036556917e-06, "loss": 0.4358, "step": 9752 }, { "epoch": 1.8, "learning_rate": 7.2360323428519e-06, "loss": 0.4264, "step": 9753 }, { "epoch": 1.8, "learning_rate": 7.234112759424072e-06, "loss": 0.4531, "step": 9754 }, { "epoch": 1.8, "learning_rate": 7.232193286350027e-06, "loss": 0.4183, "step": 9755 }, { "epoch": 1.8, "learning_rate": 7.230273923706342e-06, "loss": 0.4268, "step": 9756 }, { "epoch": 1.81, "learning_rate": 7.228354671569604e-06, "loss": 0.4197, "step": 9757 }, { "epoch": 1.81, "learning_rate": 7.226435530016382e-06, "loss": 0.424, "step": 9758 }, { "epoch": 1.81, "learning_rate": 7.224516499123244e-06, "loss": 0.4619, "step": 9759 }, { "epoch": 1.81, "learning_rate": 7.222597578966763e-06, "loss": 0.4438, "step": 9760 }, { "epoch": 1.81, "learning_rate": 7.220678769623492e-06, "loss": 0.4247, "step": 9761 }, { "epoch": 1.81, "learning_rate": 7.218760071169997e-06, "loss": 0.4274, "step": 9762 }, { "epoch": 1.81, "learning_rate": 7.2168414836828245e-06, "loss": 0.4075, "step": 9763 }, { "epoch": 1.81, "learning_rate": 7.214923007238521e-06, "loss": 0.4267, "step": 9764 }, { "epoch": 1.81, "learning_rate": 7.2130046419136364e-06, "loss": 0.4175, "step": 9765 }, { "epoch": 1.81, "learning_rate": 7.2110863877847025e-06, "loss": 0.4345, "step": 9766 }, { "epoch": 1.81, "learning_rate": 7.209168244928264e-06, "loss": 0.4343, "step": 9767 }, { "epoch": 1.81, "learning_rate": 7.207250213420844e-06, "loss": 0.4182, "step": 9768 }, { "epoch": 1.81, "learning_rate": 7.205332293338966e-06, "loss": 0.4212, "step": 9769 }, { "epoch": 1.81, "learning_rate": 7.203414484759159e-06, "loss": 0.4254, "step": 9770 }, { "epoch": 1.81, "learning_rate": 7.201496787757933e-06, "loss": 0.4393, "step": 9771 }, { "epoch": 1.81, "learning_rate": 7.1995792024118065e-06, "loss": 0.4218, "step": 9772 }, { "epoch": 1.81, "learning_rate": 7.197661728797283e-06, "loss": 0.4293, "step": 9773 }, { "epoch": 1.81, "learning_rate": 7.195744366990871e-06, "loss": 0.4368, "step": 9774 }, { "epoch": 1.81, "learning_rate": 7.193827117069064e-06, "loss": 0.4305, "step": 9775 }, { "epoch": 1.81, "learning_rate": 7.1919099791083605e-06, "loss": 0.4036, "step": 9776 }, { "epoch": 1.81, "learning_rate": 7.1899929531852494e-06, "loss": 0.4374, "step": 9777 }, { "epoch": 1.81, "learning_rate": 7.188076039376217e-06, "loss": 0.4335, "step": 9778 }, { "epoch": 1.81, "learning_rate": 7.186159237757746e-06, "loss": 0.4608, "step": 9779 }, { "epoch": 1.81, "learning_rate": 7.184242548406312e-06, "loss": 0.4408, "step": 9780 }, { "epoch": 1.81, "learning_rate": 7.182325971398383e-06, "loss": 0.4054, "step": 9781 }, { "epoch": 1.81, "learning_rate": 7.1804095068104355e-06, "loss": 0.417, "step": 9782 }, { "epoch": 1.81, "learning_rate": 7.178493154718924e-06, "loss": 0.4491, "step": 9783 }, { "epoch": 1.81, "learning_rate": 7.176576915200318e-06, "loss": 0.4113, "step": 9784 }, { "epoch": 1.81, "learning_rate": 7.1746607883310626e-06, "loss": 0.4372, "step": 9785 }, { "epoch": 1.81, "learning_rate": 7.172744774187608e-06, "loss": 0.426, "step": 9786 }, { "epoch": 1.81, "learning_rate": 7.170828872846406e-06, "loss": 0.4104, "step": 9787 }, { "epoch": 1.81, "learning_rate": 7.16891308438389e-06, "loss": 0.4324, "step": 9788 }, { "epoch": 1.81, "learning_rate": 7.166997408876504e-06, "loss": 0.4274, "step": 9789 }, { "epoch": 1.81, "learning_rate": 7.165081846400677e-06, "loss": 0.4302, "step": 9790 }, { "epoch": 1.81, "learning_rate": 7.163166397032831e-06, "loss": 0.4298, "step": 9791 }, { "epoch": 1.81, "learning_rate": 7.161251060849399e-06, "loss": 0.4159, "step": 9792 }, { "epoch": 1.81, "learning_rate": 7.159335837926788e-06, "loss": 0.4159, "step": 9793 }, { "epoch": 1.81, "learning_rate": 7.157420728341422e-06, "loss": 0.4028, "step": 9794 }, { "epoch": 1.81, "learning_rate": 7.155505732169703e-06, "loss": 0.4232, "step": 9795 }, { "epoch": 1.81, "learning_rate": 7.1535908494880415e-06, "loss": 0.4391, "step": 9796 }, { "epoch": 1.81, "learning_rate": 7.1516760803728335e-06, "loss": 0.4301, "step": 9797 }, { "epoch": 1.81, "learning_rate": 7.149761424900478e-06, "loss": 0.4151, "step": 9798 }, { "epoch": 1.81, "learning_rate": 7.147846883147362e-06, "loss": 0.4447, "step": 9799 }, { "epoch": 1.81, "learning_rate": 7.145932455189877e-06, "loss": 0.4263, "step": 9800 }, { "epoch": 1.81, "learning_rate": 7.144018141104402e-06, "loss": 0.4414, "step": 9801 }, { "epoch": 1.81, "learning_rate": 7.142103940967318e-06, "loss": 0.435, "step": 9802 }, { "epoch": 1.81, "learning_rate": 7.1401898548549905e-06, "loss": 0.4201, "step": 9803 }, { "epoch": 1.81, "learning_rate": 7.138275882843797e-06, "loss": 0.4108, "step": 9804 }, { "epoch": 1.81, "learning_rate": 7.136362025010094e-06, "loss": 0.4304, "step": 9805 }, { "epoch": 1.81, "learning_rate": 7.134448281430249e-06, "loss": 0.441, "step": 9806 }, { "epoch": 1.81, "learning_rate": 7.13253465218061e-06, "loss": 0.42, "step": 9807 }, { "epoch": 1.81, "learning_rate": 7.130621137337528e-06, "loss": 0.4117, "step": 9808 }, { "epoch": 1.81, "learning_rate": 7.128707736977352e-06, "loss": 0.4268, "step": 9809 }, { "epoch": 1.81, "learning_rate": 7.126794451176418e-06, "loss": 0.4266, "step": 9810 }, { "epoch": 1.82, "learning_rate": 7.12488128001107e-06, "loss": 0.4046, "step": 9811 }, { "epoch": 1.82, "learning_rate": 7.1229682235576355e-06, "loss": 0.4447, "step": 9812 }, { "epoch": 1.82, "learning_rate": 7.121055281892438e-06, "loss": 0.4083, "step": 9813 }, { "epoch": 1.82, "learning_rate": 7.11914245509181e-06, "loss": 0.4287, "step": 9814 }, { "epoch": 1.82, "learning_rate": 7.117229743232059e-06, "loss": 0.4274, "step": 9815 }, { "epoch": 1.82, "learning_rate": 7.115317146389508e-06, "loss": 0.4359, "step": 9816 }, { "epoch": 1.82, "learning_rate": 7.113404664640457e-06, "loss": 0.4556, "step": 9817 }, { "epoch": 1.82, "learning_rate": 7.111492298061221e-06, "loss": 0.4065, "step": 9818 }, { "epoch": 1.82, "learning_rate": 7.109580046728094e-06, "loss": 0.4272, "step": 9819 }, { "epoch": 1.82, "learning_rate": 7.107667910717369e-06, "loss": 0.4325, "step": 9820 }, { "epoch": 1.82, "learning_rate": 7.105755890105342e-06, "loss": 0.4214, "step": 9821 }, { "epoch": 1.82, "learning_rate": 7.103843984968291e-06, "loss": 0.4313, "step": 9822 }, { "epoch": 1.82, "learning_rate": 7.101932195382508e-06, "loss": 0.4043, "step": 9823 }, { "epoch": 1.82, "learning_rate": 7.1000205214242636e-06, "loss": 0.4124, "step": 9824 }, { "epoch": 1.82, "learning_rate": 7.09810896316983e-06, "loss": 0.4188, "step": 9825 }, { "epoch": 1.82, "learning_rate": 7.096197520695478e-06, "loss": 0.4354, "step": 9826 }, { "epoch": 1.82, "learning_rate": 7.094286194077467e-06, "loss": 0.4303, "step": 9827 }, { "epoch": 1.82, "learning_rate": 7.092374983392057e-06, "loss": 0.3993, "step": 9828 }, { "epoch": 1.82, "learning_rate": 7.090463888715504e-06, "loss": 0.4336, "step": 9829 }, { "epoch": 1.82, "learning_rate": 7.088552910124051e-06, "loss": 0.4013, "step": 9830 }, { "epoch": 1.82, "learning_rate": 7.086642047693953e-06, "loss": 0.4271, "step": 9831 }, { "epoch": 1.82, "learning_rate": 7.084731301501436e-06, "loss": 0.4451, "step": 9832 }, { "epoch": 1.82, "learning_rate": 7.082820671622747e-06, "loss": 0.4314, "step": 9833 }, { "epoch": 1.82, "learning_rate": 7.080910158134113e-06, "loss": 0.447, "step": 9834 }, { "epoch": 1.82, "learning_rate": 7.078999761111756e-06, "loss": 0.4445, "step": 9835 }, { "epoch": 1.82, "learning_rate": 7.077089480631904e-06, "loss": 0.4266, "step": 9836 }, { "epoch": 1.82, "learning_rate": 7.0751793167707665e-06, "loss": 0.4175, "step": 9837 }, { "epoch": 1.82, "learning_rate": 7.073269269604561e-06, "loss": 0.4367, "step": 9838 }, { "epoch": 1.82, "learning_rate": 7.0713593392094905e-06, "loss": 0.4156, "step": 9839 }, { "epoch": 1.82, "learning_rate": 7.0694495256617635e-06, "loss": 0.4354, "step": 9840 }, { "epoch": 1.82, "learning_rate": 7.067539829037575e-06, "loss": 0.422, "step": 9841 }, { "epoch": 1.82, "learning_rate": 7.065630249413114e-06, "loss": 0.4076, "step": 9842 }, { "epoch": 1.82, "learning_rate": 7.063720786864577e-06, "loss": 0.4328, "step": 9843 }, { "epoch": 1.82, "learning_rate": 7.06181144146814e-06, "loss": 0.4079, "step": 9844 }, { "epoch": 1.82, "learning_rate": 7.059902213299991e-06, "loss": 0.4076, "step": 9845 }, { "epoch": 1.82, "learning_rate": 7.057993102436301e-06, "loss": 0.4226, "step": 9846 }, { "epoch": 1.82, "learning_rate": 7.0560841089532336e-06, "loss": 0.4117, "step": 9847 }, { "epoch": 1.82, "learning_rate": 7.054175232926965e-06, "loss": 0.4531, "step": 9848 }, { "epoch": 1.82, "learning_rate": 7.0522664744336465e-06, "loss": 0.4109, "step": 9849 }, { "epoch": 1.82, "learning_rate": 7.050357833549442e-06, "loss": 0.4301, "step": 9850 }, { "epoch": 1.82, "learning_rate": 7.048449310350496e-06, "loss": 0.441, "step": 9851 }, { "epoch": 1.82, "learning_rate": 7.0465409049129596e-06, "loss": 0.4383, "step": 9852 }, { "epoch": 1.82, "learning_rate": 7.044632617312972e-06, "loss": 0.429, "step": 9853 }, { "epoch": 1.82, "learning_rate": 7.0427244476266695e-06, "loss": 0.3944, "step": 9854 }, { "epoch": 1.82, "learning_rate": 7.040816395930188e-06, "loss": 0.4317, "step": 9855 }, { "epoch": 1.82, "learning_rate": 7.038908462299657e-06, "loss": 0.4518, "step": 9856 }, { "epoch": 1.82, "learning_rate": 7.03700064681119e-06, "loss": 0.4196, "step": 9857 }, { "epoch": 1.82, "learning_rate": 7.035092949540915e-06, "loss": 0.4072, "step": 9858 }, { "epoch": 1.82, "learning_rate": 7.033185370564939e-06, "loss": 0.4527, "step": 9859 }, { "epoch": 1.82, "learning_rate": 7.031277909959378e-06, "loss": 0.4374, "step": 9860 }, { "epoch": 1.82, "learning_rate": 7.029370567800326e-06, "loss": 0.4174, "step": 9861 }, { "epoch": 1.82, "learning_rate": 7.027463344163894e-06, "loss": 0.4505, "step": 9862 }, { "epoch": 1.82, "learning_rate": 7.025556239126171e-06, "loss": 0.4342, "step": 9863 }, { "epoch": 1.82, "learning_rate": 7.023649252763243e-06, "loss": 0.4197, "step": 9864 }, { "epoch": 1.83, "learning_rate": 7.021742385151204e-06, "loss": 0.423, "step": 9865 }, { "epoch": 1.83, "learning_rate": 7.0198356363661234e-06, "loss": 0.4052, "step": 9866 }, { "epoch": 1.83, "learning_rate": 7.01792900648409e-06, "loss": 0.4137, "step": 9867 }, { "epoch": 1.83, "learning_rate": 7.0160224955811665e-06, "loss": 0.4304, "step": 9868 }, { "epoch": 1.83, "learning_rate": 7.014116103733417e-06, "loss": 0.4232, "step": 9869 }, { "epoch": 1.83, "learning_rate": 7.01220983101691e-06, "loss": 0.4215, "step": 9870 }, { "epoch": 1.83, "learning_rate": 7.0103036775076964e-06, "loss": 0.4509, "step": 9871 }, { "epoch": 1.83, "learning_rate": 7.008397643281835e-06, "loss": 0.4336, "step": 9872 }, { "epoch": 1.83, "learning_rate": 7.006491728415366e-06, "loss": 0.4258, "step": 9873 }, { "epoch": 1.83, "learning_rate": 7.004585932984334e-06, "loss": 0.414, "step": 9874 }, { "epoch": 1.83, "learning_rate": 7.0026802570647774e-06, "loss": 0.4088, "step": 9875 }, { "epoch": 1.83, "learning_rate": 7.000774700732731e-06, "loss": 0.4473, "step": 9876 }, { "epoch": 1.83, "learning_rate": 6.998869264064219e-06, "loss": 0.3944, "step": 9877 }, { "epoch": 1.83, "learning_rate": 6.99696394713527e-06, "loss": 0.4139, "step": 9878 }, { "epoch": 1.83, "learning_rate": 6.995058750021896e-06, "loss": 0.4318, "step": 9879 }, { "epoch": 1.83, "learning_rate": 6.993153672800117e-06, "loss": 0.4274, "step": 9880 }, { "epoch": 1.83, "learning_rate": 6.991248715545937e-06, "loss": 0.4197, "step": 9881 }, { "epoch": 1.83, "learning_rate": 6.989343878335366e-06, "loss": 0.3967, "step": 9882 }, { "epoch": 1.83, "learning_rate": 6.9874391612443956e-06, "loss": 0.4308, "step": 9883 }, { "epoch": 1.83, "learning_rate": 6.98553456434903e-06, "loss": 0.4311, "step": 9884 }, { "epoch": 1.83, "learning_rate": 6.983630087725254e-06, "loss": 0.4446, "step": 9885 }, { "epoch": 1.83, "learning_rate": 6.9817257314490484e-06, "loss": 0.4322, "step": 9886 }, { "epoch": 1.83, "learning_rate": 6.979821495596402e-06, "loss": 0.4287, "step": 9887 }, { "epoch": 1.83, "learning_rate": 6.977917380243282e-06, "loss": 0.4208, "step": 9888 }, { "epoch": 1.83, "learning_rate": 6.976013385465668e-06, "loss": 0.4322, "step": 9889 }, { "epoch": 1.83, "learning_rate": 6.974109511339521e-06, "loss": 0.424, "step": 9890 }, { "epoch": 1.83, "learning_rate": 6.972205757940797e-06, "loss": 0.427, "step": 9891 }, { "epoch": 1.83, "learning_rate": 6.970302125345463e-06, "loss": 0.4155, "step": 9892 }, { "epoch": 1.83, "learning_rate": 6.96839861362946e-06, "loss": 0.4398, "step": 9893 }, { "epoch": 1.83, "learning_rate": 6.966495222868744e-06, "loss": 0.4079, "step": 9894 }, { "epoch": 1.83, "learning_rate": 6.964591953139252e-06, "loss": 0.3912, "step": 9895 }, { "epoch": 1.83, "learning_rate": 6.962688804516917e-06, "loss": 0.4377, "step": 9896 }, { "epoch": 1.83, "learning_rate": 6.96078577707768e-06, "loss": 0.4115, "step": 9897 }, { "epoch": 1.83, "learning_rate": 6.958882870897459e-06, "loss": 0.4332, "step": 9898 }, { "epoch": 1.83, "learning_rate": 6.956980086052185e-06, "loss": 0.4322, "step": 9899 }, { "epoch": 1.83, "learning_rate": 6.955077422617768e-06, "loss": 0.4323, "step": 9900 }, { "epoch": 1.83, "learning_rate": 6.953174880670126e-06, "loss": 0.4087, "step": 9901 }, { "epoch": 1.83, "learning_rate": 6.951272460285166e-06, "loss": 0.4281, "step": 9902 }, { "epoch": 1.83, "learning_rate": 6.949370161538789e-06, "loss": 0.4183, "step": 9903 }, { "epoch": 1.83, "learning_rate": 6.947467984506895e-06, "loss": 0.4125, "step": 9904 }, { "epoch": 1.83, "learning_rate": 6.945565929265377e-06, "loss": 0.4346, "step": 9905 }, { "epoch": 1.83, "learning_rate": 6.9436639958901216e-06, "loss": 0.4334, "step": 9906 }, { "epoch": 1.83, "learning_rate": 6.941762184457017e-06, "loss": 0.467, "step": 9907 }, { "epoch": 1.83, "learning_rate": 6.939860495041937e-06, "loss": 0.4262, "step": 9908 }, { "epoch": 1.83, "learning_rate": 6.937958927720759e-06, "loss": 0.4051, "step": 9909 }, { "epoch": 1.83, "learning_rate": 6.936057482569347e-06, "loss": 0.4393, "step": 9910 }, { "epoch": 1.83, "learning_rate": 6.9341561596635744e-06, "loss": 0.4266, "step": 9911 }, { "epoch": 1.83, "learning_rate": 6.932254959079293e-06, "loss": 0.4198, "step": 9912 }, { "epoch": 1.83, "learning_rate": 6.930353880892355e-06, "loss": 0.4302, "step": 9913 }, { "epoch": 1.83, "learning_rate": 6.928452925178619e-06, "loss": 0.43, "step": 9914 }, { "epoch": 1.83, "learning_rate": 6.9265520920139195e-06, "loss": 0.4357, "step": 9915 }, { "epoch": 1.83, "learning_rate": 6.924651381474106e-06, "loss": 0.4193, "step": 9916 }, { "epoch": 1.83, "learning_rate": 6.922750793635008e-06, "loss": 0.4367, "step": 9917 }, { "epoch": 1.83, "learning_rate": 6.920850328572452e-06, "loss": 0.4066, "step": 9918 }, { "epoch": 1.84, "learning_rate": 6.918949986362271e-06, "loss": 0.4305, "step": 9919 }, { "epoch": 1.84, "learning_rate": 6.917049767080277e-06, "loss": 0.4336, "step": 9920 }, { "epoch": 1.84, "learning_rate": 6.9151496708022936e-06, "loss": 0.4109, "step": 9921 }, { "epoch": 1.84, "learning_rate": 6.913249697604125e-06, "loss": 0.4317, "step": 9922 }, { "epoch": 1.84, "learning_rate": 6.911349847561578e-06, "loss": 0.4174, "step": 9923 }, { "epoch": 1.84, "learning_rate": 6.909450120750454e-06, "loss": 0.4238, "step": 9924 }, { "epoch": 1.84, "learning_rate": 6.907550517246548e-06, "loss": 0.4238, "step": 9925 }, { "epoch": 1.84, "learning_rate": 6.905651037125651e-06, "loss": 0.4242, "step": 9926 }, { "epoch": 1.84, "learning_rate": 6.903751680463549e-06, "loss": 0.428, "step": 9927 }, { "epoch": 1.84, "learning_rate": 6.901852447336021e-06, "loss": 0.4279, "step": 9928 }, { "epoch": 1.84, "learning_rate": 6.8999533378188475e-06, "loss": 0.4138, "step": 9929 }, { "epoch": 1.84, "learning_rate": 6.898054351987793e-06, "loss": 0.4369, "step": 9930 }, { "epoch": 1.84, "learning_rate": 6.896155489918629e-06, "loss": 0.4407, "step": 9931 }, { "epoch": 1.84, "learning_rate": 6.894256751687112e-06, "loss": 0.4002, "step": 9932 }, { "epoch": 1.84, "learning_rate": 6.892358137369002e-06, "loss": 0.4387, "step": 9933 }, { "epoch": 1.84, "learning_rate": 6.890459647040051e-06, "loss": 0.4464, "step": 9934 }, { "epoch": 1.84, "learning_rate": 6.888561280775998e-06, "loss": 0.4351, "step": 9935 }, { "epoch": 1.84, "learning_rate": 6.886663038652594e-06, "loss": 0.4239, "step": 9936 }, { "epoch": 1.84, "learning_rate": 6.8847649207455655e-06, "loss": 0.4195, "step": 9937 }, { "epoch": 1.84, "learning_rate": 6.882866927130654e-06, "loss": 0.4193, "step": 9938 }, { "epoch": 1.84, "learning_rate": 6.88096905788358e-06, "loss": 0.4197, "step": 9939 }, { "epoch": 1.84, "learning_rate": 6.879071313080061e-06, "loss": 0.4253, "step": 9940 }, { "epoch": 1.84, "learning_rate": 6.8771736927958246e-06, "loss": 0.4341, "step": 9941 }, { "epoch": 1.84, "learning_rate": 6.87527619710657e-06, "loss": 0.438, "step": 9942 }, { "epoch": 1.84, "learning_rate": 6.873378826088015e-06, "loss": 0.4357, "step": 9943 }, { "epoch": 1.84, "learning_rate": 6.871481579815857e-06, "loss": 0.4337, "step": 9944 }, { "epoch": 1.84, "learning_rate": 6.869584458365786e-06, "loss": 0.4148, "step": 9945 }, { "epoch": 1.84, "learning_rate": 6.867687461813504e-06, "loss": 0.4472, "step": 9946 }, { "epoch": 1.84, "learning_rate": 6.865790590234689e-06, "loss": 0.4253, "step": 9947 }, { "epoch": 1.84, "learning_rate": 6.86389384370503e-06, "loss": 0.4259, "step": 9948 }, { "epoch": 1.84, "learning_rate": 6.861997222300196e-06, "loss": 0.4215, "step": 9949 }, { "epoch": 1.84, "learning_rate": 6.860100726095868e-06, "loss": 0.4207, "step": 9950 }, { "epoch": 1.84, "learning_rate": 6.858204355167705e-06, "loss": 0.4081, "step": 9951 }, { "epoch": 1.84, "learning_rate": 6.856308109591372e-06, "loss": 0.4043, "step": 9952 }, { "epoch": 1.84, "learning_rate": 6.854411989442524e-06, "loss": 0.4098, "step": 9953 }, { "epoch": 1.84, "learning_rate": 6.852515994796816e-06, "loss": 0.4272, "step": 9954 }, { "epoch": 1.84, "learning_rate": 6.85062012572989e-06, "loss": 0.4132, "step": 9955 }, { "epoch": 1.84, "learning_rate": 6.848724382317393e-06, "loss": 0.4383, "step": 9956 }, { "epoch": 1.84, "learning_rate": 6.846828764634954e-06, "loss": 0.4459, "step": 9957 }, { "epoch": 1.84, "learning_rate": 6.844933272758214e-06, "loss": 0.4183, "step": 9958 }, { "epoch": 1.84, "learning_rate": 6.843037906762792e-06, "loss": 0.4066, "step": 9959 }, { "epoch": 1.84, "learning_rate": 6.841142666724316e-06, "loss": 0.413, "step": 9960 }, { "epoch": 1.84, "learning_rate": 6.839247552718398e-06, "loss": 0.4299, "step": 9961 }, { "epoch": 1.84, "learning_rate": 6.837352564820647e-06, "loss": 0.4328, "step": 9962 }, { "epoch": 1.84, "learning_rate": 6.835457703106678e-06, "loss": 0.4446, "step": 9963 }, { "epoch": 1.84, "learning_rate": 6.833562967652083e-06, "loss": 0.4485, "step": 9964 }, { "epoch": 1.84, "learning_rate": 6.831668358532466e-06, "loss": 0.4309, "step": 9965 }, { "epoch": 1.84, "learning_rate": 6.829773875823418e-06, "loss": 0.4311, "step": 9966 }, { "epoch": 1.84, "learning_rate": 6.827879519600518e-06, "loss": 0.4333, "step": 9967 }, { "epoch": 1.84, "learning_rate": 6.825985289939354e-06, "loss": 0.4233, "step": 9968 }, { "epoch": 1.84, "learning_rate": 6.824091186915499e-06, "loss": 0.43, "step": 9969 }, { "epoch": 1.84, "learning_rate": 6.822197210604529e-06, "loss": 0.4126, "step": 9970 }, { "epoch": 1.84, "learning_rate": 6.820303361082002e-06, "loss": 0.4377, "step": 9971 }, { "epoch": 1.84, "learning_rate": 6.818409638423489e-06, "loss": 0.4137, "step": 9972 }, { "epoch": 1.85, "learning_rate": 6.816516042704539e-06, "loss": 0.4084, "step": 9973 }, { "epoch": 1.85, "learning_rate": 6.814622574000702e-06, "loss": 0.4252, "step": 9974 }, { "epoch": 1.85, "learning_rate": 6.812729232387531e-06, "loss": 0.4273, "step": 9975 }, { "epoch": 1.85, "learning_rate": 6.810836017940559e-06, "loss": 0.4067, "step": 9976 }, { "epoch": 1.85, "learning_rate": 6.808942930735327e-06, "loss": 0.4252, "step": 9977 }, { "epoch": 1.85, "learning_rate": 6.807049970847365e-06, "loss": 0.4266, "step": 9978 }, { "epoch": 1.85, "learning_rate": 6.805157138352196e-06, "loss": 0.4084, "step": 9979 }, { "epoch": 1.85, "learning_rate": 6.803264433325342e-06, "loss": 0.4464, "step": 9980 }, { "epoch": 1.85, "learning_rate": 6.801371855842318e-06, "loss": 0.4351, "step": 9981 }, { "epoch": 1.85, "learning_rate": 6.799479405978636e-06, "loss": 0.4091, "step": 9982 }, { "epoch": 1.85, "learning_rate": 6.797587083809802e-06, "loss": 0.4227, "step": 9983 }, { "epoch": 1.85, "learning_rate": 6.7956948894113095e-06, "loss": 0.4119, "step": 9984 }, { "epoch": 1.85, "learning_rate": 6.793802822858663e-06, "loss": 0.4002, "step": 9985 }, { "epoch": 1.85, "learning_rate": 6.791910884227344e-06, "loss": 0.4208, "step": 9986 }, { "epoch": 1.85, "learning_rate": 6.790019073592844e-06, "loss": 0.4308, "step": 9987 }, { "epoch": 1.85, "learning_rate": 6.788127391030641e-06, "loss": 0.4303, "step": 9988 }, { "epoch": 1.85, "learning_rate": 6.786235836616204e-06, "loss": 0.4285, "step": 9989 }, { "epoch": 1.85, "learning_rate": 6.78434441042501e-06, "loss": 0.4189, "step": 9990 }, { "epoch": 1.85, "learning_rate": 6.782453112532517e-06, "loss": 0.4389, "step": 9991 }, { "epoch": 1.85, "learning_rate": 6.7805619430141925e-06, "loss": 0.4303, "step": 9992 }, { "epoch": 1.85, "learning_rate": 6.7786709019454855e-06, "loss": 0.4356, "step": 9993 }, { "epoch": 1.85, "learning_rate": 6.77677998940184e-06, "loss": 0.4359, "step": 9994 }, { "epoch": 1.85, "learning_rate": 6.774889205458711e-06, "loss": 0.4347, "step": 9995 }, { "epoch": 1.85, "learning_rate": 6.772998550191527e-06, "loss": 0.4244, "step": 9996 }, { "epoch": 1.85, "learning_rate": 6.77110802367573e-06, "loss": 0.4257, "step": 9997 }, { "epoch": 1.85, "learning_rate": 6.769217625986741e-06, "loss": 0.4257, "step": 9998 }, { "epoch": 1.85, "learning_rate": 6.767327357199991e-06, "loss": 0.4273, "step": 9999 }, { "epoch": 1.85, "learning_rate": 6.765437217390893e-06, "loss": 0.4208, "step": 10000 }, { "epoch": 1.85, "learning_rate": 6.7635472066348606e-06, "loss": 0.4266, "step": 10001 }, { "epoch": 1.85, "learning_rate": 6.761657325007302e-06, "loss": 0.4442, "step": 10002 }, { "epoch": 1.85, "learning_rate": 6.759767572583622e-06, "loss": 0.4188, "step": 10003 }, { "epoch": 1.85, "learning_rate": 6.757877949439216e-06, "loss": 0.4143, "step": 10004 }, { "epoch": 1.85, "learning_rate": 6.755988455649479e-06, "loss": 0.4366, "step": 10005 }, { "epoch": 1.85, "learning_rate": 6.754099091289792e-06, "loss": 0.404, "step": 10006 }, { "epoch": 1.85, "learning_rate": 6.7522098564355465e-06, "loss": 0.4254, "step": 10007 }, { "epoch": 1.85, "learning_rate": 6.75032075116211e-06, "loss": 0.4327, "step": 10008 }, { "epoch": 1.85, "learning_rate": 6.7484317755448635e-06, "loss": 0.4054, "step": 10009 }, { "epoch": 1.85, "learning_rate": 6.7465429296591685e-06, "loss": 0.4257, "step": 10010 }, { "epoch": 1.85, "learning_rate": 6.744654213580384e-06, "loss": 0.4287, "step": 10011 }, { "epoch": 1.85, "learning_rate": 6.742765627383873e-06, "loss": 0.4315, "step": 10012 }, { "epoch": 1.85, "learning_rate": 6.740877171144977e-06, "loss": 0.4268, "step": 10013 }, { "epoch": 1.85, "learning_rate": 6.738988844939054e-06, "loss": 0.4137, "step": 10014 }, { "epoch": 1.85, "learning_rate": 6.737100648841437e-06, "loss": 0.4229, "step": 10015 }, { "epoch": 1.85, "learning_rate": 6.735212582927459e-06, "loss": 0.4245, "step": 10016 }, { "epoch": 1.85, "learning_rate": 6.73332464727246e-06, "loss": 0.4542, "step": 10017 }, { "epoch": 1.85, "learning_rate": 6.731436841951755e-06, "loss": 0.4176, "step": 10018 }, { "epoch": 1.85, "learning_rate": 6.729549167040672e-06, "loss": 0.4522, "step": 10019 }, { "epoch": 1.85, "learning_rate": 6.727661622614517e-06, "loss": 0.4345, "step": 10020 }, { "epoch": 1.85, "learning_rate": 6.72577420874861e-06, "loss": 0.4404, "step": 10021 }, { "epoch": 1.85, "learning_rate": 6.72388692551825e-06, "loss": 0.4099, "step": 10022 }, { "epoch": 1.85, "learning_rate": 6.721999772998732e-06, "loss": 0.4118, "step": 10023 }, { "epoch": 1.85, "learning_rate": 6.720112751265357e-06, "loss": 0.4394, "step": 10024 }, { "epoch": 1.85, "learning_rate": 6.718225860393408e-06, "loss": 0.4086, "step": 10025 }, { "epoch": 1.85, "learning_rate": 6.716339100458176e-06, "loss": 0.4192, "step": 10026 }, { "epoch": 1.86, "learning_rate": 6.71445247153493e-06, "loss": 0.4201, "step": 10027 }, { "epoch": 1.86, "learning_rate": 6.712565973698948e-06, "loss": 0.4094, "step": 10028 }, { "epoch": 1.86, "learning_rate": 6.7106796070254984e-06, "loss": 0.4312, "step": 10029 }, { "epoch": 1.86, "learning_rate": 6.708793371589841e-06, "loss": 0.4166, "step": 10030 }, { "epoch": 1.86, "learning_rate": 6.7069072674672356e-06, "loss": 0.4214, "step": 10031 }, { "epoch": 1.86, "learning_rate": 6.705021294732934e-06, "loss": 0.4221, "step": 10032 }, { "epoch": 1.86, "learning_rate": 6.703135453462179e-06, "loss": 0.415, "step": 10033 }, { "epoch": 1.86, "learning_rate": 6.70124974373022e-06, "loss": 0.4261, "step": 10034 }, { "epoch": 1.86, "learning_rate": 6.699364165612285e-06, "loss": 0.4502, "step": 10035 }, { "epoch": 1.86, "learning_rate": 6.697478719183611e-06, "loss": 0.4427, "step": 10036 }, { "epoch": 1.86, "learning_rate": 6.695593404519423e-06, "loss": 0.455, "step": 10037 }, { "epoch": 1.86, "learning_rate": 6.6937082216949355e-06, "loss": 0.4271, "step": 10038 }, { "epoch": 1.86, "learning_rate": 6.691823170785373e-06, "loss": 0.4374, "step": 10039 }, { "epoch": 1.86, "learning_rate": 6.689938251865937e-06, "loss": 0.437, "step": 10040 }, { "epoch": 1.86, "learning_rate": 6.688053465011841e-06, "loss": 0.4394, "step": 10041 }, { "epoch": 1.86, "learning_rate": 6.686168810298275e-06, "loss": 0.4205, "step": 10042 }, { "epoch": 1.86, "learning_rate": 6.684284287800442e-06, "loss": 0.4324, "step": 10043 }, { "epoch": 1.86, "learning_rate": 6.6823998975935275e-06, "loss": 0.4164, "step": 10044 }, { "epoch": 1.86, "learning_rate": 6.680515639752709e-06, "loss": 0.4295, "step": 10045 }, { "epoch": 1.86, "learning_rate": 6.678631514353178e-06, "loss": 0.4149, "step": 10046 }, { "epoch": 1.86, "learning_rate": 6.676747521470093e-06, "loss": 0.4256, "step": 10047 }, { "epoch": 1.86, "learning_rate": 6.674863661178635e-06, "loss": 0.4551, "step": 10048 }, { "epoch": 1.86, "learning_rate": 6.672979933553958e-06, "loss": 0.4321, "step": 10049 }, { "epoch": 1.86, "learning_rate": 6.6710963386712215e-06, "loss": 0.4192, "step": 10050 }, { "epoch": 1.86, "learning_rate": 6.669212876605578e-06, "loss": 0.4364, "step": 10051 }, { "epoch": 1.86, "learning_rate": 6.667329547432173e-06, "loss": 0.4285, "step": 10052 }, { "epoch": 1.86, "learning_rate": 6.66544635122615e-06, "loss": 0.4186, "step": 10053 }, { "epoch": 1.86, "learning_rate": 6.663563288062646e-06, "loss": 0.4157, "step": 10054 }, { "epoch": 1.86, "learning_rate": 6.661680358016786e-06, "loss": 0.4179, "step": 10055 }, { "epoch": 1.86, "learning_rate": 6.659797561163701e-06, "loss": 0.4005, "step": 10056 }, { "epoch": 1.86, "learning_rate": 6.657914897578507e-06, "loss": 0.4253, "step": 10057 }, { "epoch": 1.86, "learning_rate": 6.656032367336325e-06, "loss": 0.4217, "step": 10058 }, { "epoch": 1.86, "learning_rate": 6.654149970512258e-06, "loss": 0.3974, "step": 10059 }, { "epoch": 1.86, "learning_rate": 6.65226770718141e-06, "loss": 0.4526, "step": 10060 }, { "epoch": 1.86, "learning_rate": 6.650385577418888e-06, "loss": 0.397, "step": 10061 }, { "epoch": 1.86, "learning_rate": 6.648503581299772e-06, "loss": 0.432, "step": 10062 }, { "epoch": 1.86, "learning_rate": 6.646621718899165e-06, "loss": 0.4057, "step": 10063 }, { "epoch": 1.86, "learning_rate": 6.644739990292137e-06, "loss": 0.4151, "step": 10064 }, { "epoch": 1.86, "learning_rate": 6.642858395553777e-06, "loss": 0.4364, "step": 10065 }, { "epoch": 1.86, "learning_rate": 6.640976934759152e-06, "loss": 0.4306, "step": 10066 }, { "epoch": 1.86, "learning_rate": 6.639095607983321e-06, "loss": 0.4284, "step": 10067 }, { "epoch": 1.86, "learning_rate": 6.637214415301358e-06, "loss": 0.4518, "step": 10068 }, { "epoch": 1.86, "learning_rate": 6.635333356788312e-06, "loss": 0.423, "step": 10069 }, { "epoch": 1.86, "learning_rate": 6.6334524325192375e-06, "loss": 0.4148, "step": 10070 }, { "epoch": 1.86, "learning_rate": 6.631571642569179e-06, "loss": 0.4537, "step": 10071 }, { "epoch": 1.86, "learning_rate": 6.6296909870131695e-06, "loss": 0.4271, "step": 10072 }, { "epoch": 1.86, "learning_rate": 6.6278104659262556e-06, "loss": 0.4211, "step": 10073 }, { "epoch": 1.86, "learning_rate": 6.625930079383456e-06, "loss": 0.4369, "step": 10074 }, { "epoch": 1.86, "learning_rate": 6.624049827459803e-06, "loss": 0.4169, "step": 10075 }, { "epoch": 1.86, "learning_rate": 6.62216971023031e-06, "loss": 0.4285, "step": 10076 }, { "epoch": 1.86, "learning_rate": 6.620289727769991e-06, "loss": 0.4356, "step": 10077 }, { "epoch": 1.86, "learning_rate": 6.618409880153855e-06, "loss": 0.4158, "step": 10078 }, { "epoch": 1.86, "learning_rate": 6.616530167456905e-06, "loss": 0.4327, "step": 10079 }, { "epoch": 1.86, "learning_rate": 6.614650589754134e-06, "loss": 0.437, "step": 10080 }, { "epoch": 1.87, "learning_rate": 6.612771147120542e-06, "loss": 0.4223, "step": 10081 }, { "epoch": 1.87, "learning_rate": 6.610891839631104e-06, "loss": 0.437, "step": 10082 }, { "epoch": 1.87, "learning_rate": 6.609012667360812e-06, "loss": 0.405, "step": 10083 }, { "epoch": 1.87, "learning_rate": 6.607133630384631e-06, "loss": 0.4153, "step": 10084 }, { "epoch": 1.87, "learning_rate": 6.605254728777542e-06, "loss": 0.4073, "step": 10085 }, { "epoch": 1.87, "learning_rate": 6.603375962614499e-06, "loss": 0.4364, "step": 10086 }, { "epoch": 1.87, "learning_rate": 6.60149733197047e-06, "loss": 0.4108, "step": 10087 }, { "epoch": 1.87, "learning_rate": 6.599618836920408e-06, "loss": 0.4186, "step": 10088 }, { "epoch": 1.87, "learning_rate": 6.597740477539251e-06, "loss": 0.429, "step": 10089 }, { "epoch": 1.87, "learning_rate": 6.595862253901955e-06, "loss": 0.442, "step": 10090 }, { "epoch": 1.87, "learning_rate": 6.593984166083449e-06, "loss": 0.4333, "step": 10091 }, { "epoch": 1.87, "learning_rate": 6.592106214158674e-06, "loss": 0.413, "step": 10092 }, { "epoch": 1.87, "learning_rate": 6.590228398202549e-06, "loss": 0.402, "step": 10093 }, { "epoch": 1.87, "learning_rate": 6.588350718289995e-06, "loss": 0.4398, "step": 10094 }, { "epoch": 1.87, "learning_rate": 6.586473174495935e-06, "loss": 0.4276, "step": 10095 }, { "epoch": 1.87, "learning_rate": 6.584595766895272e-06, "loss": 0.4269, "step": 10096 }, { "epoch": 1.87, "learning_rate": 6.582718495562917e-06, "loss": 0.4292, "step": 10097 }, { "epoch": 1.87, "learning_rate": 6.580841360573769e-06, "loss": 0.4334, "step": 10098 }, { "epoch": 1.87, "learning_rate": 6.578964362002716e-06, "loss": 0.4399, "step": 10099 }, { "epoch": 1.87, "learning_rate": 6.5770874999246506e-06, "loss": 0.4342, "step": 10100 }, { "epoch": 1.87, "learning_rate": 6.575210774414459e-06, "loss": 0.4253, "step": 10101 }, { "epoch": 1.87, "learning_rate": 6.573334185547016e-06, "loss": 0.4068, "step": 10102 }, { "epoch": 1.87, "learning_rate": 6.571457733397196e-06, "loss": 0.4357, "step": 10103 }, { "epoch": 1.87, "learning_rate": 6.569581418039861e-06, "loss": 0.4344, "step": 10104 }, { "epoch": 1.87, "learning_rate": 6.567705239549881e-06, "loss": 0.4457, "step": 10105 }, { "epoch": 1.87, "learning_rate": 6.5658291980021025e-06, "loss": 0.4297, "step": 10106 }, { "epoch": 1.87, "learning_rate": 6.563953293471386e-06, "loss": 0.4229, "step": 10107 }, { "epoch": 1.87, "learning_rate": 6.562077526032565e-06, "loss": 0.4351, "step": 10108 }, { "epoch": 1.87, "learning_rate": 6.560201895760492e-06, "loss": 0.4245, "step": 10109 }, { "epoch": 1.87, "learning_rate": 6.558326402729993e-06, "loss": 0.4424, "step": 10110 }, { "epoch": 1.87, "learning_rate": 6.556451047015895e-06, "loss": 0.4461, "step": 10111 }, { "epoch": 1.87, "learning_rate": 6.554575828693029e-06, "loss": 0.4377, "step": 10112 }, { "epoch": 1.87, "learning_rate": 6.552700747836205e-06, "loss": 0.4263, "step": 10113 }, { "epoch": 1.87, "learning_rate": 6.550825804520241e-06, "loss": 0.4241, "step": 10114 }, { "epoch": 1.87, "learning_rate": 6.548950998819943e-06, "loss": 0.4261, "step": 10115 }, { "epoch": 1.87, "learning_rate": 6.547076330810105e-06, "loss": 0.4483, "step": 10116 }, { "epoch": 1.87, "learning_rate": 6.545201800565534e-06, "loss": 0.4553, "step": 10117 }, { "epoch": 1.87, "learning_rate": 6.54332740816101e-06, "loss": 0.4364, "step": 10118 }, { "epoch": 1.87, "learning_rate": 6.541453153671327e-06, "loss": 0.429, "step": 10119 }, { "epoch": 1.87, "learning_rate": 6.53957903717126e-06, "loss": 0.4196, "step": 10120 }, { "epoch": 1.87, "learning_rate": 6.537705058735577e-06, "loss": 0.4192, "step": 10121 }, { "epoch": 1.87, "learning_rate": 6.535831218439057e-06, "loss": 0.4228, "step": 10122 }, { "epoch": 1.87, "learning_rate": 6.533957516356455e-06, "loss": 0.4271, "step": 10123 }, { "epoch": 1.87, "learning_rate": 6.532083952562533e-06, "loss": 0.439, "step": 10124 }, { "epoch": 1.87, "learning_rate": 6.530210527132039e-06, "loss": 0.4108, "step": 10125 }, { "epoch": 1.87, "learning_rate": 6.528337240139722e-06, "loss": 0.4432, "step": 10126 }, { "epoch": 1.87, "learning_rate": 6.52646409166032e-06, "loss": 0.4404, "step": 10127 }, { "epoch": 1.87, "learning_rate": 6.52459108176857e-06, "loss": 0.4293, "step": 10128 }, { "epoch": 1.87, "learning_rate": 6.522718210539202e-06, "loss": 0.4229, "step": 10129 }, { "epoch": 1.87, "learning_rate": 6.520845478046939e-06, "loss": 0.4377, "step": 10130 }, { "epoch": 1.87, "learning_rate": 6.518972884366499e-06, "loss": 0.4168, "step": 10131 }, { "epoch": 1.87, "learning_rate": 6.517100429572601e-06, "loss": 0.4022, "step": 10132 }, { "epoch": 1.87, "learning_rate": 6.51522811373994e-06, "loss": 0.4152, "step": 10133 }, { "epoch": 1.87, "learning_rate": 6.513355936943231e-06, "loss": 0.4312, "step": 10134 }, { "epoch": 1.88, "learning_rate": 6.5114838992571604e-06, "loss": 0.4337, "step": 10135 }, { "epoch": 1.88, "learning_rate": 6.5096120007564265e-06, "loss": 0.4255, "step": 10136 }, { "epoch": 1.88, "learning_rate": 6.507740241515713e-06, "loss": 0.4238, "step": 10137 }, { "epoch": 1.88, "learning_rate": 6.505868621609694e-06, "loss": 0.4094, "step": 10138 }, { "epoch": 1.88, "learning_rate": 6.5039971411130505e-06, "loss": 0.4188, "step": 10139 }, { "epoch": 1.88, "learning_rate": 6.502125800100445e-06, "loss": 0.4136, "step": 10140 }, { "epoch": 1.88, "learning_rate": 6.50025459864655e-06, "loss": 0.4346, "step": 10141 }, { "epoch": 1.88, "learning_rate": 6.498383536826014e-06, "loss": 0.4369, "step": 10142 }, { "epoch": 1.88, "learning_rate": 6.496512614713489e-06, "loss": 0.4301, "step": 10143 }, { "epoch": 1.88, "learning_rate": 6.494641832383628e-06, "loss": 0.4304, "step": 10144 }, { "epoch": 1.88, "learning_rate": 6.492771189911064e-06, "loss": 0.4341, "step": 10145 }, { "epoch": 1.88, "learning_rate": 6.490900687370439e-06, "loss": 0.4219, "step": 10146 }, { "epoch": 1.88, "learning_rate": 6.489030324836381e-06, "loss": 0.4373, "step": 10147 }, { "epoch": 1.88, "learning_rate": 6.487160102383508e-06, "loss": 0.4136, "step": 10148 }, { "epoch": 1.88, "learning_rate": 6.4852900200864475e-06, "loss": 0.4531, "step": 10149 }, { "epoch": 1.88, "learning_rate": 6.483420078019804e-06, "loss": 0.4205, "step": 10150 }, { "epoch": 1.88, "learning_rate": 6.481550276258193e-06, "loss": 0.4223, "step": 10151 }, { "epoch": 1.88, "learning_rate": 6.479680614876207e-06, "loss": 0.399, "step": 10152 }, { "epoch": 1.88, "learning_rate": 6.47781109394845e-06, "loss": 0.4304, "step": 10153 }, { "epoch": 1.88, "learning_rate": 6.4759417135495085e-06, "loss": 0.4247, "step": 10154 }, { "epoch": 1.88, "learning_rate": 6.474072473753968e-06, "loss": 0.4462, "step": 10155 }, { "epoch": 1.88, "learning_rate": 6.4722033746364066e-06, "loss": 0.4279, "step": 10156 }, { "epoch": 1.88, "learning_rate": 6.4703344162713995e-06, "loss": 0.4497, "step": 10157 }, { "epoch": 1.88, "learning_rate": 6.468465598733515e-06, "loss": 0.4074, "step": 10158 }, { "epoch": 1.88, "learning_rate": 6.466596922097315e-06, "loss": 0.4293, "step": 10159 }, { "epoch": 1.88, "learning_rate": 6.464728386437353e-06, "loss": 0.3978, "step": 10160 }, { "epoch": 1.88, "learning_rate": 6.462859991828188e-06, "loss": 0.4148, "step": 10161 }, { "epoch": 1.88, "learning_rate": 6.460991738344355e-06, "loss": 0.444, "step": 10162 }, { "epoch": 1.88, "learning_rate": 6.459123626060404e-06, "loss": 0.4122, "step": 10163 }, { "epoch": 1.88, "learning_rate": 6.457255655050865e-06, "loss": 0.407, "step": 10164 }, { "epoch": 1.88, "learning_rate": 6.4553878253902605e-06, "loss": 0.4425, "step": 10165 }, { "epoch": 1.88, "learning_rate": 6.453520137153124e-06, "loss": 0.4159, "step": 10166 }, { "epoch": 1.88, "learning_rate": 6.451652590413963e-06, "loss": 0.4279, "step": 10167 }, { "epoch": 1.88, "learning_rate": 6.449785185247299e-06, "loss": 0.4439, "step": 10168 }, { "epoch": 1.88, "learning_rate": 6.447917921727633e-06, "loss": 0.4197, "step": 10169 }, { "epoch": 1.88, "learning_rate": 6.446050799929462e-06, "loss": 0.4284, "step": 10170 }, { "epoch": 1.88, "learning_rate": 6.4441838199272875e-06, "loss": 0.4259, "step": 10171 }, { "epoch": 1.88, "learning_rate": 6.442316981795591e-06, "loss": 0.4197, "step": 10172 }, { "epoch": 1.88, "learning_rate": 6.4404502856088655e-06, "loss": 0.4373, "step": 10173 }, { "epoch": 1.88, "learning_rate": 6.438583731441577e-06, "loss": 0.4248, "step": 10174 }, { "epoch": 1.88, "learning_rate": 6.436717319368209e-06, "loss": 0.4195, "step": 10175 }, { "epoch": 1.88, "learning_rate": 6.434851049463221e-06, "loss": 0.4107, "step": 10176 }, { "epoch": 1.88, "learning_rate": 6.432984921801075e-06, "loss": 0.4221, "step": 10177 }, { "epoch": 1.88, "learning_rate": 6.4311189364562266e-06, "loss": 0.4172, "step": 10178 }, { "epoch": 1.88, "learning_rate": 6.429253093503125e-06, "loss": 0.4304, "step": 10179 }, { "epoch": 1.88, "learning_rate": 6.427387393016213e-06, "loss": 0.419, "step": 10180 }, { "epoch": 1.88, "learning_rate": 6.425521835069933e-06, "loss": 0.4279, "step": 10181 }, { "epoch": 1.88, "learning_rate": 6.423656419738709e-06, "loss": 0.4294, "step": 10182 }, { "epoch": 1.88, "learning_rate": 6.421791147096976e-06, "loss": 0.4182, "step": 10183 }, { "epoch": 1.88, "learning_rate": 6.419926017219149e-06, "loss": 0.4293, "step": 10184 }, { "epoch": 1.88, "learning_rate": 6.418061030179648e-06, "loss": 0.4265, "step": 10185 }, { "epoch": 1.88, "learning_rate": 6.416196186052881e-06, "loss": 0.4143, "step": 10186 }, { "epoch": 1.88, "learning_rate": 6.414331484913246e-06, "loss": 0.4071, "step": 10187 }, { "epoch": 1.88, "learning_rate": 6.412466926835151e-06, "loss": 0.4392, "step": 10188 }, { "epoch": 1.89, "learning_rate": 6.410602511892979e-06, "loss": 0.4331, "step": 10189 }, { "epoch": 1.89, "learning_rate": 6.408738240161125e-06, "loss": 0.4366, "step": 10190 }, { "epoch": 1.89, "learning_rate": 6.406874111713968e-06, "loss": 0.4136, "step": 10191 }, { "epoch": 1.89, "learning_rate": 6.4050101266258745e-06, "loss": 0.434, "step": 10192 }, { "epoch": 1.89, "learning_rate": 6.403146284971227e-06, "loss": 0.4318, "step": 10193 }, { "epoch": 1.89, "learning_rate": 6.4012825868243775e-06, "loss": 0.4082, "step": 10194 }, { "epoch": 1.89, "learning_rate": 6.399419032259696e-06, "loss": 0.3967, "step": 10195 }, { "epoch": 1.89, "learning_rate": 6.397555621351525e-06, "loss": 0.4484, "step": 10196 }, { "epoch": 1.89, "learning_rate": 6.3956923541742165e-06, "loss": 0.4361, "step": 10197 }, { "epoch": 1.89, "learning_rate": 6.393829230802112e-06, "loss": 0.4255, "step": 10198 }, { "epoch": 1.89, "learning_rate": 6.39196625130954e-06, "loss": 0.4336, "step": 10199 }, { "epoch": 1.89, "learning_rate": 6.390103415770838e-06, "loss": 0.4232, "step": 10200 }, { "epoch": 1.89, "learning_rate": 6.388240724260323e-06, "loss": 0.4249, "step": 10201 }, { "epoch": 1.89, "learning_rate": 6.386378176852319e-06, "loss": 0.4167, "step": 10202 }, { "epoch": 1.89, "learning_rate": 6.3845157736211335e-06, "loss": 0.4159, "step": 10203 }, { "epoch": 1.89, "learning_rate": 6.3826535146410765e-06, "loss": 0.4216, "step": 10204 }, { "epoch": 1.89, "learning_rate": 6.380791399986446e-06, "loss": 0.4243, "step": 10205 }, { "epoch": 1.89, "learning_rate": 6.378929429731537e-06, "loss": 0.4433, "step": 10206 }, { "epoch": 1.89, "learning_rate": 6.377067603950639e-06, "loss": 0.4195, "step": 10207 }, { "epoch": 1.89, "learning_rate": 6.37520592271804e-06, "loss": 0.4288, "step": 10208 }, { "epoch": 1.89, "learning_rate": 6.373344386108008e-06, "loss": 0.4142, "step": 10209 }, { "epoch": 1.89, "learning_rate": 6.371482994194824e-06, "loss": 0.3955, "step": 10210 }, { "epoch": 1.89, "learning_rate": 6.3696217470527475e-06, "loss": 0.4279, "step": 10211 }, { "epoch": 1.89, "learning_rate": 6.367760644756047e-06, "loss": 0.4334, "step": 10212 }, { "epoch": 1.89, "learning_rate": 6.36589968737897e-06, "loss": 0.4421, "step": 10213 }, { "epoch": 1.89, "learning_rate": 6.364038874995764e-06, "loss": 0.4303, "step": 10214 }, { "epoch": 1.89, "learning_rate": 6.362178207680678e-06, "loss": 0.4261, "step": 10215 }, { "epoch": 1.89, "learning_rate": 6.360317685507944e-06, "loss": 0.4145, "step": 10216 }, { "epoch": 1.89, "learning_rate": 6.358457308551798e-06, "loss": 0.4202, "step": 10217 }, { "epoch": 1.89, "learning_rate": 6.35659707688646e-06, "loss": 0.4244, "step": 10218 }, { "epoch": 1.89, "learning_rate": 6.354736990586157e-06, "loss": 0.4229, "step": 10219 }, { "epoch": 1.89, "learning_rate": 6.352877049725099e-06, "loss": 0.417, "step": 10220 }, { "epoch": 1.89, "learning_rate": 6.35101725437749e-06, "loss": 0.4287, "step": 10221 }, { "epoch": 1.89, "learning_rate": 6.349157604617542e-06, "loss": 0.4091, "step": 10222 }, { "epoch": 1.89, "learning_rate": 6.347298100519441e-06, "loss": 0.4056, "step": 10223 }, { "epoch": 1.89, "learning_rate": 6.345438742157387e-06, "loss": 0.4111, "step": 10224 }, { "epoch": 1.89, "learning_rate": 6.343579529605559e-06, "loss": 0.4383, "step": 10225 }, { "epoch": 1.89, "learning_rate": 6.341720462938138e-06, "loss": 0.4196, "step": 10226 }, { "epoch": 1.89, "learning_rate": 6.3398615422292974e-06, "loss": 0.4291, "step": 10227 }, { "epoch": 1.89, "learning_rate": 6.338002767553205e-06, "loss": 0.4311, "step": 10228 }, { "epoch": 1.89, "learning_rate": 6.336144138984022e-06, "loss": 0.4373, "step": 10229 }, { "epoch": 1.89, "learning_rate": 6.3342856565959064e-06, "loss": 0.4214, "step": 10230 }, { "epoch": 1.89, "learning_rate": 6.332427320463002e-06, "loss": 0.4174, "step": 10231 }, { "epoch": 1.89, "learning_rate": 6.330569130659462e-06, "loss": 0.4125, "step": 10232 }, { "epoch": 1.89, "learning_rate": 6.328711087259416e-06, "loss": 0.4108, "step": 10233 }, { "epoch": 1.89, "learning_rate": 6.326853190337003e-06, "loss": 0.4036, "step": 10234 }, { "epoch": 1.89, "learning_rate": 6.324995439966348e-06, "loss": 0.4306, "step": 10235 }, { "epoch": 1.89, "learning_rate": 6.323137836221567e-06, "loss": 0.4029, "step": 10236 }, { "epoch": 1.89, "learning_rate": 6.321280379176782e-06, "loss": 0.4306, "step": 10237 }, { "epoch": 1.89, "learning_rate": 6.319423068906095e-06, "loss": 0.424, "step": 10238 }, { "epoch": 1.89, "learning_rate": 6.317565905483618e-06, "loss": 0.4273, "step": 10239 }, { "epoch": 1.89, "learning_rate": 6.3157088889834396e-06, "loss": 0.4315, "step": 10240 }, { "epoch": 1.89, "learning_rate": 6.313852019479658e-06, "loss": 0.4375, "step": 10241 }, { "epoch": 1.89, "learning_rate": 6.311995297046357e-06, "loss": 0.4113, "step": 10242 }, { "epoch": 1.9, "learning_rate": 6.310138721757612e-06, "loss": 0.4104, "step": 10243 }, { "epoch": 1.9, "learning_rate": 6.308282293687503e-06, "loss": 0.4457, "step": 10244 }, { "epoch": 1.9, "learning_rate": 6.306426012910092e-06, "loss": 0.4187, "step": 10245 }, { "epoch": 1.9, "learning_rate": 6.304569879499449e-06, "loss": 0.4022, "step": 10246 }, { "epoch": 1.9, "learning_rate": 6.302713893529626e-06, "loss": 0.4216, "step": 10247 }, { "epoch": 1.9, "learning_rate": 6.300858055074669e-06, "loss": 0.417, "step": 10248 }, { "epoch": 1.9, "learning_rate": 6.299002364208631e-06, "loss": 0.4234, "step": 10249 }, { "epoch": 1.9, "learning_rate": 6.297146821005542e-06, "loss": 0.4259, "step": 10250 }, { "epoch": 1.9, "learning_rate": 6.2952914255394425e-06, "loss": 0.432, "step": 10251 }, { "epoch": 1.9, "learning_rate": 6.293436177884356e-06, "loss": 0.4427, "step": 10252 }, { "epoch": 1.9, "learning_rate": 6.291581078114301e-06, "loss": 0.4122, "step": 10253 }, { "epoch": 1.9, "learning_rate": 6.289726126303297e-06, "loss": 0.4226, "step": 10254 }, { "epoch": 1.9, "learning_rate": 6.287871322525352e-06, "loss": 0.4363, "step": 10255 }, { "epoch": 1.9, "learning_rate": 6.286016666854466e-06, "loss": 0.4262, "step": 10256 }, { "epoch": 1.9, "learning_rate": 6.284162159364642e-06, "loss": 0.4477, "step": 10257 }, { "epoch": 1.9, "learning_rate": 6.282307800129864e-06, "loss": 0.4174, "step": 10258 }, { "epoch": 1.9, "learning_rate": 6.280453589224126e-06, "loss": 0.4297, "step": 10259 }, { "epoch": 1.9, "learning_rate": 6.278599526721398e-06, "loss": 0.4116, "step": 10260 }, { "epoch": 1.9, "learning_rate": 6.276745612695665e-06, "loss": 0.4341, "step": 10261 }, { "epoch": 1.9, "learning_rate": 6.274891847220883e-06, "loss": 0.4194, "step": 10262 }, { "epoch": 1.9, "learning_rate": 6.273038230371023e-06, "loss": 0.43, "step": 10263 }, { "epoch": 1.9, "learning_rate": 6.2711847622200394e-06, "loss": 0.4356, "step": 10264 }, { "epoch": 1.9, "learning_rate": 6.269331442841875e-06, "loss": 0.4366, "step": 10265 }, { "epoch": 1.9, "learning_rate": 6.267478272310482e-06, "loss": 0.4292, "step": 10266 }, { "epoch": 1.9, "learning_rate": 6.265625250699792e-06, "loss": 0.4247, "step": 10267 }, { "epoch": 1.9, "learning_rate": 6.263772378083745e-06, "loss": 0.4412, "step": 10268 }, { "epoch": 1.9, "learning_rate": 6.261919654536261e-06, "loss": 0.4195, "step": 10269 }, { "epoch": 1.9, "learning_rate": 6.26006708013126e-06, "loss": 0.4383, "step": 10270 }, { "epoch": 1.9, "learning_rate": 6.258214654942662e-06, "loss": 0.4319, "step": 10271 }, { "epoch": 1.9, "learning_rate": 6.256362379044366e-06, "loss": 0.4096, "step": 10272 }, { "epoch": 1.9, "learning_rate": 6.254510252510285e-06, "loss": 0.4275, "step": 10273 }, { "epoch": 1.9, "learning_rate": 6.25265827541431e-06, "loss": 0.4358, "step": 10274 }, { "epoch": 1.9, "learning_rate": 6.250806447830329e-06, "loss": 0.4168, "step": 10275 }, { "epoch": 1.9, "learning_rate": 6.248954769832231e-06, "loss": 0.4269, "step": 10276 }, { "epoch": 1.9, "learning_rate": 6.247103241493891e-06, "loss": 0.4364, "step": 10277 }, { "epoch": 1.9, "learning_rate": 6.245251862889186e-06, "loss": 0.4477, "step": 10278 }, { "epoch": 1.9, "learning_rate": 6.243400634091978e-06, "loss": 0.4254, "step": 10279 }, { "epoch": 1.9, "learning_rate": 6.241549555176129e-06, "loss": 0.4344, "step": 10280 }, { "epoch": 1.9, "learning_rate": 6.239698626215496e-06, "loss": 0.4441, "step": 10281 }, { "epoch": 1.9, "learning_rate": 6.237847847283924e-06, "loss": 0.4195, "step": 10282 }, { "epoch": 1.9, "learning_rate": 6.235997218455259e-06, "loss": 0.4146, "step": 10283 }, { "epoch": 1.9, "learning_rate": 6.234146739803335e-06, "loss": 0.4161, "step": 10284 }, { "epoch": 1.9, "learning_rate": 6.2322964114019834e-06, "loss": 0.4206, "step": 10285 }, { "epoch": 1.9, "learning_rate": 6.230446233325033e-06, "loss": 0.4508, "step": 10286 }, { "epoch": 1.9, "learning_rate": 6.228596205646293e-06, "loss": 0.4116, "step": 10287 }, { "epoch": 1.9, "learning_rate": 6.226746328439588e-06, "loss": 0.4219, "step": 10288 }, { "epoch": 1.9, "learning_rate": 6.2248966017787114e-06, "loss": 0.4192, "step": 10289 }, { "epoch": 1.9, "learning_rate": 6.223047025737478e-06, "loss": 0.4328, "step": 10290 }, { "epoch": 1.9, "learning_rate": 6.2211976003896746e-06, "loss": 0.4285, "step": 10291 }, { "epoch": 1.9, "learning_rate": 6.219348325809085e-06, "loss": 0.4133, "step": 10292 }, { "epoch": 1.9, "learning_rate": 6.217499202069504e-06, "loss": 0.4413, "step": 10293 }, { "epoch": 1.9, "learning_rate": 6.215650229244695e-06, "loss": 0.4151, "step": 10294 }, { "epoch": 1.9, "learning_rate": 6.213801407408442e-06, "loss": 0.4172, "step": 10295 }, { "epoch": 1.9, "learning_rate": 6.211952736634501e-06, "loss": 0.412, "step": 10296 }, { "epoch": 1.91, "learning_rate": 6.210104216996628e-06, "loss": 0.426, "step": 10297 }, { "epoch": 1.91, "learning_rate": 6.208255848568585e-06, "loss": 0.417, "step": 10298 }, { "epoch": 1.91, "learning_rate": 6.206407631424109e-06, "loss": 0.4025, "step": 10299 }, { "epoch": 1.91, "learning_rate": 6.204559565636951e-06, "loss": 0.4228, "step": 10300 }, { "epoch": 1.91, "learning_rate": 6.2027116512808346e-06, "loss": 0.4228, "step": 10301 }, { "epoch": 1.91, "learning_rate": 6.200863888429494e-06, "loss": 0.415, "step": 10302 }, { "epoch": 1.91, "learning_rate": 6.199016277156651e-06, "loss": 0.4232, "step": 10303 }, { "epoch": 1.91, "learning_rate": 6.197168817536019e-06, "loss": 0.4154, "step": 10304 }, { "epoch": 1.91, "learning_rate": 6.195321509641312e-06, "loss": 0.4363, "step": 10305 }, { "epoch": 1.91, "learning_rate": 6.193474353546233e-06, "loss": 0.4221, "step": 10306 }, { "epoch": 1.91, "learning_rate": 6.191627349324478e-06, "loss": 0.4111, "step": 10307 }, { "epoch": 1.91, "learning_rate": 6.189780497049744e-06, "loss": 0.4297, "step": 10308 }, { "epoch": 1.91, "learning_rate": 6.18793379679571e-06, "loss": 0.4079, "step": 10309 }, { "epoch": 1.91, "learning_rate": 6.1860872486360636e-06, "loss": 0.3989, "step": 10310 }, { "epoch": 1.91, "learning_rate": 6.18424085264447e-06, "loss": 0.4032, "step": 10311 }, { "epoch": 1.91, "learning_rate": 6.182394608894605e-06, "loss": 0.4281, "step": 10312 }, { "epoch": 1.91, "learning_rate": 6.180548517460128e-06, "loss": 0.433, "step": 10313 }, { "epoch": 1.91, "learning_rate": 6.17870257841469e-06, "loss": 0.4246, "step": 10314 }, { "epoch": 1.91, "learning_rate": 6.176856791831948e-06, "loss": 0.4124, "step": 10315 }, { "epoch": 1.91, "learning_rate": 6.175011157785537e-06, "loss": 0.4343, "step": 10316 }, { "epoch": 1.91, "learning_rate": 6.173165676349103e-06, "loss": 0.4094, "step": 10317 }, { "epoch": 1.91, "learning_rate": 6.171320347596275e-06, "loss": 0.4275, "step": 10318 }, { "epoch": 1.91, "learning_rate": 6.169475171600671e-06, "loss": 0.4279, "step": 10319 }, { "epoch": 1.91, "learning_rate": 6.167630148435919e-06, "loss": 0.4316, "step": 10320 }, { "epoch": 1.91, "learning_rate": 6.165785278175625e-06, "loss": 0.4102, "step": 10321 }, { "epoch": 1.91, "learning_rate": 6.163940560893405e-06, "loss": 0.406, "step": 10322 }, { "epoch": 1.91, "learning_rate": 6.162095996662853e-06, "loss": 0.4033, "step": 10323 }, { "epoch": 1.91, "learning_rate": 6.160251585557562e-06, "loss": 0.4214, "step": 10324 }, { "epoch": 1.91, "learning_rate": 6.158407327651127e-06, "loss": 0.4229, "step": 10325 }, { "epoch": 1.91, "learning_rate": 6.1565632230171225e-06, "loss": 0.4386, "step": 10326 }, { "epoch": 1.91, "learning_rate": 6.154719271729135e-06, "loss": 0.4274, "step": 10327 }, { "epoch": 1.91, "learning_rate": 6.152875473860726e-06, "loss": 0.3933, "step": 10328 }, { "epoch": 1.91, "learning_rate": 6.151031829485464e-06, "loss": 0.4201, "step": 10329 }, { "epoch": 1.91, "learning_rate": 6.149188338676903e-06, "loss": 0.4033, "step": 10330 }, { "epoch": 1.91, "learning_rate": 6.1473450015086014e-06, "loss": 0.4263, "step": 10331 }, { "epoch": 1.91, "learning_rate": 6.1455018180540995e-06, "loss": 0.4408, "step": 10332 }, { "epoch": 1.91, "learning_rate": 6.143658788386938e-06, "loss": 0.4202, "step": 10333 }, { "epoch": 1.91, "learning_rate": 6.1418159125806524e-06, "loss": 0.4293, "step": 10334 }, { "epoch": 1.91, "learning_rate": 6.13997319070877e-06, "loss": 0.4332, "step": 10335 }, { "epoch": 1.91, "learning_rate": 6.138130622844807e-06, "loss": 0.4121, "step": 10336 }, { "epoch": 1.91, "learning_rate": 6.136288209062285e-06, "loss": 0.4393, "step": 10337 }, { "epoch": 1.91, "learning_rate": 6.134445949434706e-06, "loss": 0.4369, "step": 10338 }, { "epoch": 1.91, "learning_rate": 6.132603844035582e-06, "loss": 0.4235, "step": 10339 }, { "epoch": 1.91, "learning_rate": 6.130761892938404e-06, "loss": 0.4197, "step": 10340 }, { "epoch": 1.91, "learning_rate": 6.128920096216658e-06, "loss": 0.4292, "step": 10341 }, { "epoch": 1.91, "learning_rate": 6.127078453943838e-06, "loss": 0.4338, "step": 10342 }, { "epoch": 1.91, "learning_rate": 6.125236966193413e-06, "loss": 0.4051, "step": 10343 }, { "epoch": 1.91, "learning_rate": 6.123395633038862e-06, "loss": 0.4285, "step": 10344 }, { "epoch": 1.91, "learning_rate": 6.121554454553649e-06, "loss": 0.42, "step": 10345 }, { "epoch": 1.91, "learning_rate": 6.119713430811228e-06, "loss": 0.4229, "step": 10346 }, { "epoch": 1.91, "learning_rate": 6.117872561885061e-06, "loss": 0.4336, "step": 10347 }, { "epoch": 1.91, "learning_rate": 6.116031847848588e-06, "loss": 0.3941, "step": 10348 }, { "epoch": 1.91, "learning_rate": 6.1141912887752575e-06, "loss": 0.3935, "step": 10349 }, { "epoch": 1.91, "learning_rate": 6.112350884738496e-06, "loss": 0.4171, "step": 10350 }, { "epoch": 1.92, "learning_rate": 6.110510635811739e-06, "loss": 0.426, "step": 10351 }, { "epoch": 1.92, "learning_rate": 6.108670542068404e-06, "loss": 0.4273, "step": 10352 }, { "epoch": 1.92, "learning_rate": 6.1068306035819115e-06, "loss": 0.4237, "step": 10353 }, { "epoch": 1.92, "learning_rate": 6.104990820425669e-06, "loss": 0.4083, "step": 10354 }, { "epoch": 1.92, "learning_rate": 6.103151192673082e-06, "loss": 0.4157, "step": 10355 }, { "epoch": 1.92, "learning_rate": 6.101311720397547e-06, "loss": 0.4243, "step": 10356 }, { "epoch": 1.92, "learning_rate": 6.099472403672459e-06, "loss": 0.457, "step": 10357 }, { "epoch": 1.92, "learning_rate": 6.097633242571196e-06, "loss": 0.4346, "step": 10358 }, { "epoch": 1.92, "learning_rate": 6.095794237167145e-06, "loss": 0.4173, "step": 10359 }, { "epoch": 1.92, "learning_rate": 6.093955387533672e-06, "loss": 0.4403, "step": 10360 }, { "epoch": 1.92, "learning_rate": 6.092116693744152e-06, "loss": 0.411, "step": 10361 }, { "epoch": 1.92, "learning_rate": 6.09027815587194e-06, "loss": 0.4296, "step": 10362 }, { "epoch": 1.92, "learning_rate": 6.088439773990387e-06, "loss": 0.4423, "step": 10363 }, { "epoch": 1.92, "learning_rate": 6.086601548172848e-06, "loss": 0.4215, "step": 10364 }, { "epoch": 1.92, "learning_rate": 6.084763478492659e-06, "loss": 0.4427, "step": 10365 }, { "epoch": 1.92, "learning_rate": 6.082925565023161e-06, "loss": 0.4225, "step": 10366 }, { "epoch": 1.92, "learning_rate": 6.081087807837682e-06, "loss": 0.4124, "step": 10367 }, { "epoch": 1.92, "learning_rate": 6.079250207009539e-06, "loss": 0.4169, "step": 10368 }, { "epoch": 1.92, "learning_rate": 6.077412762612058e-06, "loss": 0.4195, "step": 10369 }, { "epoch": 1.92, "learning_rate": 6.075575474718543e-06, "loss": 0.4291, "step": 10370 }, { "epoch": 1.92, "learning_rate": 6.073738343402302e-06, "loss": 0.4121, "step": 10371 }, { "epoch": 1.92, "learning_rate": 6.0719013687366325e-06, "loss": 0.4499, "step": 10372 }, { "epoch": 1.92, "learning_rate": 6.070064550794822e-06, "loss": 0.443, "step": 10373 }, { "epoch": 1.92, "learning_rate": 6.068227889650164e-06, "loss": 0.4402, "step": 10374 }, { "epoch": 1.92, "learning_rate": 6.066391385375929e-06, "loss": 0.4282, "step": 10375 }, { "epoch": 1.92, "learning_rate": 6.0645550380454e-06, "loss": 0.4179, "step": 10376 }, { "epoch": 1.92, "learning_rate": 6.062718847731835e-06, "loss": 0.4453, "step": 10377 }, { "epoch": 1.92, "learning_rate": 6.0608828145085005e-06, "loss": 0.4245, "step": 10378 }, { "epoch": 1.92, "learning_rate": 6.059046938448647e-06, "loss": 0.4213, "step": 10379 }, { "epoch": 1.92, "learning_rate": 6.057211219625525e-06, "loss": 0.4464, "step": 10380 }, { "epoch": 1.92, "learning_rate": 6.055375658112374e-06, "loss": 0.4227, "step": 10381 }, { "epoch": 1.92, "learning_rate": 6.053540253982433e-06, "loss": 0.4249, "step": 10382 }, { "epoch": 1.92, "learning_rate": 6.051705007308929e-06, "loss": 0.4222, "step": 10383 }, { "epoch": 1.92, "learning_rate": 6.049869918165086e-06, "loss": 0.4247, "step": 10384 }, { "epoch": 1.92, "learning_rate": 6.048034986624116e-06, "loss": 0.447, "step": 10385 }, { "epoch": 1.92, "learning_rate": 6.046200212759238e-06, "loss": 0.419, "step": 10386 }, { "epoch": 1.92, "learning_rate": 6.044365596643646e-06, "loss": 0.428, "step": 10387 }, { "epoch": 1.92, "learning_rate": 6.042531138350548e-06, "loss": 0.4473, "step": 10388 }, { "epoch": 1.92, "learning_rate": 6.0406968379531305e-06, "loss": 0.42, "step": 10389 }, { "epoch": 1.92, "learning_rate": 6.038862695524574e-06, "loss": 0.4181, "step": 10390 }, { "epoch": 1.92, "learning_rate": 6.037028711138067e-06, "loss": 0.4172, "step": 10391 }, { "epoch": 1.92, "learning_rate": 6.035194884866773e-06, "loss": 0.4457, "step": 10392 }, { "epoch": 1.92, "learning_rate": 6.033361216783866e-06, "loss": 0.4213, "step": 10393 }, { "epoch": 1.92, "learning_rate": 6.031527706962502e-06, "loss": 0.4137, "step": 10394 }, { "epoch": 1.92, "learning_rate": 6.029694355475833e-06, "loss": 0.4088, "step": 10395 }, { "epoch": 1.92, "learning_rate": 6.027861162397011e-06, "loss": 0.42, "step": 10396 }, { "epoch": 1.92, "learning_rate": 6.026028127799169e-06, "loss": 0.4235, "step": 10397 }, { "epoch": 1.92, "learning_rate": 6.024195251755454e-06, "loss": 0.4298, "step": 10398 }, { "epoch": 1.92, "learning_rate": 6.022362534338982e-06, "loss": 0.4455, "step": 10399 }, { "epoch": 1.92, "learning_rate": 6.0205299756228845e-06, "loss": 0.4552, "step": 10400 }, { "epoch": 1.92, "learning_rate": 6.018697575680272e-06, "loss": 0.4157, "step": 10401 }, { "epoch": 1.92, "learning_rate": 6.016865334584252e-06, "loss": 0.4351, "step": 10402 }, { "epoch": 1.92, "learning_rate": 6.015033252407934e-06, "loss": 0.4158, "step": 10403 }, { "epoch": 1.92, "learning_rate": 6.013201329224408e-06, "loss": 0.4383, "step": 10404 }, { "epoch": 1.93, "learning_rate": 6.011369565106773e-06, "loss": 0.4247, "step": 10405 }, { "epoch": 1.93, "learning_rate": 6.009537960128103e-06, "loss": 0.4175, "step": 10406 }, { "epoch": 1.93, "learning_rate": 6.007706514361482e-06, "loss": 0.4166, "step": 10407 }, { "epoch": 1.93, "learning_rate": 6.0058752278799796e-06, "loss": 0.397, "step": 10408 }, { "epoch": 1.93, "learning_rate": 6.0040441007566595e-06, "loss": 0.4245, "step": 10409 }, { "epoch": 1.93, "learning_rate": 6.002213133064583e-06, "loss": 0.3999, "step": 10410 }, { "epoch": 1.93, "learning_rate": 6.000382324876801e-06, "loss": 0.4287, "step": 10411 }, { "epoch": 1.93, "learning_rate": 5.9985516762663555e-06, "loss": 0.4389, "step": 10412 }, { "epoch": 1.93, "learning_rate": 5.9967211873062935e-06, "loss": 0.4179, "step": 10413 }, { "epoch": 1.93, "learning_rate": 5.994890858069642e-06, "loss": 0.434, "step": 10414 }, { "epoch": 1.93, "learning_rate": 5.993060688629433e-06, "loss": 0.4354, "step": 10415 }, { "epoch": 1.93, "learning_rate": 5.991230679058684e-06, "loss": 0.4282, "step": 10416 }, { "epoch": 1.93, "learning_rate": 5.989400829430404e-06, "loss": 0.4267, "step": 10417 }, { "epoch": 1.93, "learning_rate": 5.987571139817609e-06, "loss": 0.4291, "step": 10418 }, { "epoch": 1.93, "learning_rate": 5.9857416102932946e-06, "loss": 0.412, "step": 10419 }, { "epoch": 1.93, "learning_rate": 5.9839122409304605e-06, "loss": 0.4198, "step": 10420 }, { "epoch": 1.93, "learning_rate": 5.982083031802089e-06, "loss": 0.4156, "step": 10421 }, { "epoch": 1.93, "learning_rate": 5.98025398298117e-06, "loss": 0.4374, "step": 10422 }, { "epoch": 1.93, "learning_rate": 5.978425094540674e-06, "loss": 0.4038, "step": 10423 }, { "epoch": 1.93, "learning_rate": 5.976596366553567e-06, "loss": 0.4317, "step": 10424 }, { "epoch": 1.93, "learning_rate": 5.97476779909282e-06, "loss": 0.4385, "step": 10425 }, { "epoch": 1.93, "learning_rate": 5.97293939223138e-06, "loss": 0.4313, "step": 10426 }, { "epoch": 1.93, "learning_rate": 5.9711111460422075e-06, "loss": 0.4215, "step": 10427 }, { "epoch": 1.93, "learning_rate": 5.96928306059824e-06, "loss": 0.4011, "step": 10428 }, { "epoch": 1.93, "learning_rate": 5.9674551359724155e-06, "loss": 0.4009, "step": 10429 }, { "epoch": 1.93, "learning_rate": 5.965627372237664e-06, "loss": 0.4079, "step": 10430 }, { "epoch": 1.93, "learning_rate": 5.9637997694669115e-06, "loss": 0.4352, "step": 10431 }, { "epoch": 1.93, "learning_rate": 5.961972327733074e-06, "loss": 0.422, "step": 10432 }, { "epoch": 1.93, "learning_rate": 5.960145047109067e-06, "loss": 0.4273, "step": 10433 }, { "epoch": 1.93, "learning_rate": 5.9583179276677895e-06, "loss": 0.4469, "step": 10434 }, { "epoch": 1.93, "learning_rate": 5.956490969482148e-06, "loss": 0.4228, "step": 10435 }, { "epoch": 1.93, "learning_rate": 5.9546641726250264e-06, "loss": 0.4229, "step": 10436 }, { "epoch": 1.93, "learning_rate": 5.952837537169318e-06, "loss": 0.4417, "step": 10437 }, { "epoch": 1.93, "learning_rate": 5.951011063187899e-06, "loss": 0.4316, "step": 10438 }, { "epoch": 1.93, "learning_rate": 5.949184750753638e-06, "loss": 0.408, "step": 10439 }, { "epoch": 1.93, "learning_rate": 5.94735859993941e-06, "loss": 0.4186, "step": 10440 }, { "epoch": 1.93, "learning_rate": 5.9455326108180665e-06, "loss": 0.4248, "step": 10441 }, { "epoch": 1.93, "learning_rate": 5.943706783462468e-06, "loss": 0.4491, "step": 10442 }, { "epoch": 1.93, "learning_rate": 5.941881117945457e-06, "loss": 0.4064, "step": 10443 }, { "epoch": 1.93, "learning_rate": 5.940055614339879e-06, "loss": 0.4399, "step": 10444 }, { "epoch": 1.93, "learning_rate": 5.938230272718565e-06, "loss": 0.4257, "step": 10445 }, { "epoch": 1.93, "learning_rate": 5.936405093154338e-06, "loss": 0.4216, "step": 10446 }, { "epoch": 1.93, "learning_rate": 5.93458007572003e-06, "loss": 0.4392, "step": 10447 }, { "epoch": 1.93, "learning_rate": 5.932755220488446e-06, "loss": 0.4229, "step": 10448 }, { "epoch": 1.93, "learning_rate": 5.9309305275324014e-06, "loss": 0.4329, "step": 10449 }, { "epoch": 1.93, "learning_rate": 5.929105996924695e-06, "loss": 0.4218, "step": 10450 }, { "epoch": 1.93, "learning_rate": 5.927281628738117e-06, "loss": 0.4266, "step": 10451 }, { "epoch": 1.93, "learning_rate": 5.925457423045468e-06, "loss": 0.4279, "step": 10452 }, { "epoch": 1.93, "learning_rate": 5.92363337991952e-06, "loss": 0.4223, "step": 10453 }, { "epoch": 1.93, "learning_rate": 5.921809499433055e-06, "loss": 0.4367, "step": 10454 }, { "epoch": 1.93, "learning_rate": 5.91998578165884e-06, "loss": 0.4434, "step": 10455 }, { "epoch": 1.93, "learning_rate": 5.918162226669638e-06, "loss": 0.4096, "step": 10456 }, { "epoch": 1.93, "learning_rate": 5.916338834538205e-06, "loss": 0.4224, "step": 10457 }, { "epoch": 1.93, "learning_rate": 5.914515605337293e-06, "loss": 0.4164, "step": 10458 }, { "epoch": 1.94, "learning_rate": 5.912692539139644e-06, "loss": 0.4396, "step": 10459 }, { "epoch": 1.94, "learning_rate": 5.910869636017998e-06, "loss": 0.4214, "step": 10460 }, { "epoch": 1.94, "learning_rate": 5.909046896045076e-06, "loss": 0.4318, "step": 10461 }, { "epoch": 1.94, "learning_rate": 5.907224319293615e-06, "loss": 0.4237, "step": 10462 }, { "epoch": 1.94, "learning_rate": 5.905401905836321e-06, "loss": 0.4247, "step": 10463 }, { "epoch": 1.94, "learning_rate": 5.903579655745914e-06, "loss": 0.4157, "step": 10464 }, { "epoch": 1.94, "learning_rate": 5.901757569095093e-06, "loss": 0.4464, "step": 10465 }, { "epoch": 1.94, "learning_rate": 5.899935645956558e-06, "loss": 0.4167, "step": 10466 }, { "epoch": 1.94, "learning_rate": 5.898113886403001e-06, "loss": 0.4183, "step": 10467 }, { "epoch": 1.94, "learning_rate": 5.896292290507102e-06, "loss": 0.407, "step": 10468 }, { "epoch": 1.94, "learning_rate": 5.894470858341546e-06, "loss": 0.4286, "step": 10469 }, { "epoch": 1.94, "learning_rate": 5.892649589978997e-06, "loss": 0.4136, "step": 10470 }, { "epoch": 1.94, "learning_rate": 5.890828485492129e-06, "loss": 0.4105, "step": 10471 }, { "epoch": 1.94, "learning_rate": 5.8890075449535974e-06, "loss": 0.4123, "step": 10472 }, { "epoch": 1.94, "learning_rate": 5.88718676843605e-06, "loss": 0.4006, "step": 10473 }, { "epoch": 1.94, "learning_rate": 5.885366156012138e-06, "loss": 0.4012, "step": 10474 }, { "epoch": 1.94, "learning_rate": 5.883545707754496e-06, "loss": 0.4191, "step": 10475 }, { "epoch": 1.94, "learning_rate": 5.881725423735762e-06, "loss": 0.4458, "step": 10476 }, { "epoch": 1.94, "learning_rate": 5.879905304028557e-06, "loss": 0.4091, "step": 10477 }, { "epoch": 1.94, "learning_rate": 5.8780853487055025e-06, "loss": 0.4233, "step": 10478 }, { "epoch": 1.94, "learning_rate": 5.876265557839209e-06, "loss": 0.423, "step": 10479 }, { "epoch": 1.94, "learning_rate": 5.874445931502287e-06, "loss": 0.4186, "step": 10480 }, { "epoch": 1.94, "learning_rate": 5.8726264697673344e-06, "loss": 0.4292, "step": 10481 }, { "epoch": 1.94, "learning_rate": 5.870807172706945e-06, "loss": 0.4157, "step": 10482 }, { "epoch": 1.94, "learning_rate": 5.868988040393701e-06, "loss": 0.4092, "step": 10483 }, { "epoch": 1.94, "learning_rate": 5.867169072900189e-06, "loss": 0.4131, "step": 10484 }, { "epoch": 1.94, "learning_rate": 5.865350270298975e-06, "loss": 0.4225, "step": 10485 }, { "epoch": 1.94, "learning_rate": 5.863531632662636e-06, "loss": 0.4106, "step": 10486 }, { "epoch": 1.94, "learning_rate": 5.861713160063721e-06, "loss": 0.4292, "step": 10487 }, { "epoch": 1.94, "learning_rate": 5.859894852574793e-06, "loss": 0.4258, "step": 10488 }, { "epoch": 1.94, "learning_rate": 5.858076710268395e-06, "loss": 0.4265, "step": 10489 }, { "epoch": 1.94, "learning_rate": 5.856258733217065e-06, "loss": 0.3963, "step": 10490 }, { "epoch": 1.94, "learning_rate": 5.854440921493343e-06, "loss": 0.4107, "step": 10491 }, { "epoch": 1.94, "learning_rate": 5.852623275169748e-06, "loss": 0.4167, "step": 10492 }, { "epoch": 1.94, "learning_rate": 5.850805794318811e-06, "loss": 0.435, "step": 10493 }, { "epoch": 1.94, "learning_rate": 5.8489884790130406e-06, "loss": 0.4343, "step": 10494 }, { "epoch": 1.94, "learning_rate": 5.84717132932494e-06, "loss": 0.4309, "step": 10495 }, { "epoch": 1.94, "learning_rate": 5.845354345327019e-06, "loss": 0.4118, "step": 10496 }, { "epoch": 1.94, "learning_rate": 5.843537527091763e-06, "loss": 0.4477, "step": 10497 }, { "epoch": 1.94, "learning_rate": 5.841720874691667e-06, "loss": 0.4359, "step": 10498 }, { "epoch": 1.94, "learning_rate": 5.839904388199211e-06, "loss": 0.4253, "step": 10499 }, { "epoch": 1.94, "learning_rate": 5.8380880676868625e-06, "loss": 0.42, "step": 10500 }, { "epoch": 1.94, "learning_rate": 5.8362719132270984e-06, "loss": 0.4139, "step": 10501 }, { "epoch": 1.94, "learning_rate": 5.8344559248923725e-06, "loss": 0.4397, "step": 10502 }, { "epoch": 1.94, "learning_rate": 5.832640102755148e-06, "loss": 0.4337, "step": 10503 }, { "epoch": 1.94, "learning_rate": 5.830824446887867e-06, "loss": 0.4225, "step": 10504 }, { "epoch": 1.94, "learning_rate": 5.829008957362967e-06, "loss": 0.4249, "step": 10505 }, { "epoch": 1.94, "learning_rate": 5.827193634252892e-06, "loss": 0.4098, "step": 10506 }, { "epoch": 1.94, "learning_rate": 5.825378477630061e-06, "loss": 0.4074, "step": 10507 }, { "epoch": 1.94, "learning_rate": 5.8235634875669046e-06, "loss": 0.4245, "step": 10508 }, { "epoch": 1.94, "learning_rate": 5.821748664135828e-06, "loss": 0.4147, "step": 10509 }, { "epoch": 1.94, "learning_rate": 5.819934007409247e-06, "loss": 0.4082, "step": 10510 }, { "epoch": 1.94, "learning_rate": 5.818119517459562e-06, "loss": 0.4332, "step": 10511 }, { "epoch": 1.94, "learning_rate": 5.8163051943591594e-06, "loss": 0.42, "step": 10512 }, { "epoch": 1.95, "learning_rate": 5.814491038180439e-06, "loss": 0.4031, "step": 10513 }, { "epoch": 1.95, "learning_rate": 5.812677048995772e-06, "loss": 0.4068, "step": 10514 }, { "epoch": 1.95, "learning_rate": 5.810863226877542e-06, "loss": 0.4151, "step": 10515 }, { "epoch": 1.95, "learning_rate": 5.809049571898113e-06, "loss": 0.4127, "step": 10516 }, { "epoch": 1.95, "learning_rate": 5.8072360841298435e-06, "loss": 0.4242, "step": 10517 }, { "epoch": 1.95, "learning_rate": 5.805422763645097e-06, "loss": 0.4204, "step": 10518 }, { "epoch": 1.95, "learning_rate": 5.8036096105162095e-06, "loss": 0.3976, "step": 10519 }, { "epoch": 1.95, "learning_rate": 5.801796624815534e-06, "loss": 0.4266, "step": 10520 }, { "epoch": 1.95, "learning_rate": 5.799983806615401e-06, "loss": 0.4257, "step": 10521 }, { "epoch": 1.95, "learning_rate": 5.7981711559881346e-06, "loss": 0.425, "step": 10522 }, { "epoch": 1.95, "learning_rate": 5.796358673006063e-06, "loss": 0.423, "step": 10523 }, { "epoch": 1.95, "learning_rate": 5.794546357741493e-06, "loss": 0.4146, "step": 10524 }, { "epoch": 1.95, "learning_rate": 5.7927342102667415e-06, "loss": 0.4263, "step": 10525 }, { "epoch": 1.95, "learning_rate": 5.790922230654105e-06, "loss": 0.4241, "step": 10526 }, { "epoch": 1.95, "learning_rate": 5.7891104189758765e-06, "loss": 0.4273, "step": 10527 }, { "epoch": 1.95, "learning_rate": 5.787298775304347e-06, "loss": 0.4315, "step": 10528 }, { "epoch": 1.95, "learning_rate": 5.785487299711794e-06, "loss": 0.4206, "step": 10529 }, { "epoch": 1.95, "learning_rate": 5.7836759922705e-06, "loss": 0.4165, "step": 10530 }, { "epoch": 1.95, "learning_rate": 5.781864853052722e-06, "loss": 0.4226, "step": 10531 }, { "epoch": 1.95, "learning_rate": 5.780053882130732e-06, "loss": 0.423, "step": 10532 }, { "epoch": 1.95, "learning_rate": 5.778243079576777e-06, "loss": 0.4265, "step": 10533 }, { "epoch": 1.95, "learning_rate": 5.776432445463105e-06, "loss": 0.4102, "step": 10534 }, { "epoch": 1.95, "learning_rate": 5.774621979861963e-06, "loss": 0.4201, "step": 10535 }, { "epoch": 1.95, "learning_rate": 5.772811682845575e-06, "loss": 0.4177, "step": 10536 }, { "epoch": 1.95, "learning_rate": 5.77100155448618e-06, "loss": 0.4191, "step": 10537 }, { "epoch": 1.95, "learning_rate": 5.7691915948559916e-06, "loss": 0.4098, "step": 10538 }, { "epoch": 1.95, "learning_rate": 5.7673818040272225e-06, "loss": 0.422, "step": 10539 }, { "epoch": 1.95, "learning_rate": 5.765572182072086e-06, "loss": 0.4339, "step": 10540 }, { "epoch": 1.95, "learning_rate": 5.7637627290627766e-06, "loss": 0.4452, "step": 10541 }, { "epoch": 1.95, "learning_rate": 5.761953445071495e-06, "loss": 0.422, "step": 10542 }, { "epoch": 1.95, "learning_rate": 5.760144330170421e-06, "loss": 0.4418, "step": 10543 }, { "epoch": 1.95, "learning_rate": 5.758335384431741e-06, "loss": 0.4169, "step": 10544 }, { "epoch": 1.95, "learning_rate": 5.756526607927622e-06, "loss": 0.4001, "step": 10545 }, { "epoch": 1.95, "learning_rate": 5.754718000730239e-06, "loss": 0.4136, "step": 10546 }, { "epoch": 1.95, "learning_rate": 5.752909562911744e-06, "loss": 0.4202, "step": 10547 }, { "epoch": 1.95, "learning_rate": 5.751101294544299e-06, "loss": 0.4352, "step": 10548 }, { "epoch": 1.95, "learning_rate": 5.749293195700041e-06, "loss": 0.4267, "step": 10549 }, { "epoch": 1.95, "learning_rate": 5.747485266451118e-06, "loss": 0.4256, "step": 10550 }, { "epoch": 1.95, "learning_rate": 5.745677506869656e-06, "loss": 0.4332, "step": 10551 }, { "epoch": 1.95, "learning_rate": 5.743869917027789e-06, "loss": 0.4463, "step": 10552 }, { "epoch": 1.95, "learning_rate": 5.742062496997628e-06, "loss": 0.411, "step": 10553 }, { "epoch": 1.95, "learning_rate": 5.740255246851294e-06, "loss": 0.4198, "step": 10554 }, { "epoch": 1.95, "learning_rate": 5.738448166660889e-06, "loss": 0.4672, "step": 10555 }, { "epoch": 1.95, "learning_rate": 5.7366412564985085e-06, "loss": 0.4397, "step": 10556 }, { "epoch": 1.95, "learning_rate": 5.734834516436252e-06, "loss": 0.4323, "step": 10557 }, { "epoch": 1.95, "learning_rate": 5.733027946546198e-06, "loss": 0.446, "step": 10558 }, { "epoch": 1.95, "learning_rate": 5.731221546900432e-06, "loss": 0.3995, "step": 10559 }, { "epoch": 1.95, "learning_rate": 5.729415317571023e-06, "loss": 0.4219, "step": 10560 }, { "epoch": 1.95, "learning_rate": 5.727609258630034e-06, "loss": 0.4335, "step": 10561 }, { "epoch": 1.95, "learning_rate": 5.725803370149527e-06, "loss": 0.4048, "step": 10562 }, { "epoch": 1.95, "learning_rate": 5.723997652201549e-06, "loss": 0.4166, "step": 10563 }, { "epoch": 1.95, "learning_rate": 5.722192104858152e-06, "loss": 0.4238, "step": 10564 }, { "epoch": 1.95, "learning_rate": 5.72038672819137e-06, "loss": 0.412, "step": 10565 }, { "epoch": 1.95, "learning_rate": 5.71858152227323e-06, "loss": 0.42, "step": 10566 }, { "epoch": 1.96, "learning_rate": 5.7167764871757636e-06, "loss": 0.4164, "step": 10567 }, { "epoch": 1.96, "learning_rate": 5.714971622970982e-06, "loss": 0.418, "step": 10568 }, { "epoch": 1.96, "learning_rate": 5.713166929730903e-06, "loss": 0.4349, "step": 10569 }, { "epoch": 1.96, "learning_rate": 5.711362407527527e-06, "loss": 0.4262, "step": 10570 }, { "epoch": 1.96, "learning_rate": 5.7095580564328455e-06, "loss": 0.4173, "step": 10571 }, { "epoch": 1.96, "learning_rate": 5.707753876518859e-06, "loss": 0.4416, "step": 10572 }, { "epoch": 1.96, "learning_rate": 5.705949867857541e-06, "loss": 0.4271, "step": 10573 }, { "epoch": 1.96, "learning_rate": 5.704146030520878e-06, "loss": 0.4217, "step": 10574 }, { "epoch": 1.96, "learning_rate": 5.70234236458083e-06, "loss": 0.4208, "step": 10575 }, { "epoch": 1.96, "learning_rate": 5.70053887010937e-06, "loss": 0.4224, "step": 10576 }, { "epoch": 1.96, "learning_rate": 5.698735547178449e-06, "loss": 0.4406, "step": 10577 }, { "epoch": 1.96, "learning_rate": 5.696932395860011e-06, "loss": 0.4239, "step": 10578 }, { "epoch": 1.96, "learning_rate": 5.695129416226008e-06, "loss": 0.4195, "step": 10579 }, { "epoch": 1.96, "learning_rate": 5.693326608348366e-06, "loss": 0.4233, "step": 10580 }, { "epoch": 1.96, "learning_rate": 5.691523972299024e-06, "loss": 0.451, "step": 10581 }, { "epoch": 1.96, "learning_rate": 5.689721508149898e-06, "loss": 0.4471, "step": 10582 }, { "epoch": 1.96, "learning_rate": 5.687919215972899e-06, "loss": 0.445, "step": 10583 }, { "epoch": 1.96, "learning_rate": 5.6861170958399445e-06, "loss": 0.4348, "step": 10584 }, { "epoch": 1.96, "learning_rate": 5.684315147822927e-06, "loss": 0.4287, "step": 10585 }, { "epoch": 1.96, "learning_rate": 5.682513371993749e-06, "loss": 0.4252, "step": 10586 }, { "epoch": 1.96, "learning_rate": 5.680711768424294e-06, "loss": 0.4301, "step": 10587 }, { "epoch": 1.96, "learning_rate": 5.6789103371864375e-06, "loss": 0.4225, "step": 10588 }, { "epoch": 1.96, "learning_rate": 5.677109078352064e-06, "loss": 0.397, "step": 10589 }, { "epoch": 1.96, "learning_rate": 5.675307991993028e-06, "loss": 0.4098, "step": 10590 }, { "epoch": 1.96, "learning_rate": 5.673507078181202e-06, "loss": 0.4065, "step": 10591 }, { "epoch": 1.96, "learning_rate": 5.6717063369884285e-06, "loss": 0.4326, "step": 10592 }, { "epoch": 1.96, "learning_rate": 5.669905768486563e-06, "loss": 0.4042, "step": 10593 }, { "epoch": 1.96, "learning_rate": 5.668105372747436e-06, "loss": 0.4316, "step": 10594 }, { "epoch": 1.96, "learning_rate": 5.666305149842888e-06, "loss": 0.4224, "step": 10595 }, { "epoch": 1.96, "learning_rate": 5.664505099844737e-06, "loss": 0.444, "step": 10596 }, { "epoch": 1.96, "learning_rate": 5.6627052228248116e-06, "loss": 0.4136, "step": 10597 }, { "epoch": 1.96, "learning_rate": 5.660905518854911e-06, "loss": 0.4271, "step": 10598 }, { "epoch": 1.96, "learning_rate": 5.659105988006852e-06, "loss": 0.4287, "step": 10599 }, { "epoch": 1.96, "learning_rate": 5.657306630352421e-06, "loss": 0.4392, "step": 10600 }, { "epoch": 1.96, "learning_rate": 5.655507445963422e-06, "loss": 0.4198, "step": 10601 }, { "epoch": 1.96, "learning_rate": 5.6537084349116265e-06, "loss": 0.4383, "step": 10602 }, { "epoch": 1.96, "learning_rate": 5.651909597268823e-06, "loss": 0.4071, "step": 10603 }, { "epoch": 1.96, "learning_rate": 5.650110933106776e-06, "loss": 0.4202, "step": 10604 }, { "epoch": 1.96, "learning_rate": 5.648312442497244e-06, "loss": 0.4224, "step": 10605 }, { "epoch": 1.96, "learning_rate": 5.646514125511993e-06, "loss": 0.4186, "step": 10606 }, { "epoch": 1.96, "learning_rate": 5.644715982222764e-06, "loss": 0.4146, "step": 10607 }, { "epoch": 1.96, "learning_rate": 5.642918012701308e-06, "loss": 0.4326, "step": 10608 }, { "epoch": 1.96, "learning_rate": 5.6411202170193564e-06, "loss": 0.4182, "step": 10609 }, { "epoch": 1.96, "learning_rate": 5.639322595248634e-06, "loss": 0.4289, "step": 10610 }, { "epoch": 1.96, "learning_rate": 5.63752514746087e-06, "loss": 0.4303, "step": 10611 }, { "epoch": 1.96, "learning_rate": 5.635727873727772e-06, "loss": 0.417, "step": 10612 }, { "epoch": 1.96, "learning_rate": 5.633930774121057e-06, "loss": 0.4097, "step": 10613 }, { "epoch": 1.96, "learning_rate": 5.632133848712419e-06, "loss": 0.4051, "step": 10614 }, { "epoch": 1.96, "learning_rate": 5.630337097573549e-06, "loss": 0.423, "step": 10615 }, { "epoch": 1.96, "learning_rate": 5.628540520776145e-06, "loss": 0.4265, "step": 10616 }, { "epoch": 1.96, "learning_rate": 5.626744118391874e-06, "loss": 0.4125, "step": 10617 }, { "epoch": 1.96, "learning_rate": 5.62494789049242e-06, "loss": 0.4074, "step": 10618 }, { "epoch": 1.96, "learning_rate": 5.623151837149443e-06, "loss": 0.428, "step": 10619 }, { "epoch": 1.96, "learning_rate": 5.6213559584346065e-06, "loss": 0.4275, "step": 10620 }, { "epoch": 1.97, "learning_rate": 5.61956025441956e-06, "loss": 0.4332, "step": 10621 }, { "epoch": 1.97, "learning_rate": 5.617764725175947e-06, "loss": 0.4295, "step": 10622 }, { "epoch": 1.97, "learning_rate": 5.615969370775412e-06, "loss": 0.4309, "step": 10623 }, { "epoch": 1.97, "learning_rate": 5.6141741912895765e-06, "loss": 0.4092, "step": 10624 }, { "epoch": 1.97, "learning_rate": 5.612379186790075e-06, "loss": 0.4158, "step": 10625 }, { "epoch": 1.97, "learning_rate": 5.610584357348521e-06, "loss": 0.4135, "step": 10626 }, { "epoch": 1.97, "learning_rate": 5.6087897030365215e-06, "loss": 0.4358, "step": 10627 }, { "epoch": 1.97, "learning_rate": 5.606995223925684e-06, "loss": 0.4296, "step": 10628 }, { "epoch": 1.97, "learning_rate": 5.605200920087601e-06, "loss": 0.4254, "step": 10629 }, { "epoch": 1.97, "learning_rate": 5.603406791593869e-06, "loss": 0.4217, "step": 10630 }, { "epoch": 1.97, "learning_rate": 5.601612838516066e-06, "loss": 0.4109, "step": 10631 }, { "epoch": 1.97, "learning_rate": 5.599819060925764e-06, "loss": 0.4194, "step": 10632 }, { "epoch": 1.97, "learning_rate": 5.598025458894537e-06, "loss": 0.443, "step": 10633 }, { "epoch": 1.97, "learning_rate": 5.596232032493941e-06, "loss": 0.4246, "step": 10634 }, { "epoch": 1.97, "learning_rate": 5.594438781795537e-06, "loss": 0.4421, "step": 10635 }, { "epoch": 1.97, "learning_rate": 5.592645706870869e-06, "loss": 0.4333, "step": 10636 }, { "epoch": 1.97, "learning_rate": 5.590852807791475e-06, "loss": 0.425, "step": 10637 }, { "epoch": 1.97, "learning_rate": 5.589060084628892e-06, "loss": 0.4315, "step": 10638 }, { "epoch": 1.97, "learning_rate": 5.587267537454643e-06, "loss": 0.42, "step": 10639 }, { "epoch": 1.97, "learning_rate": 5.585475166340253e-06, "loss": 0.4495, "step": 10640 }, { "epoch": 1.97, "learning_rate": 5.583682971357226e-06, "loss": 0.4419, "step": 10641 }, { "epoch": 1.97, "learning_rate": 5.581890952577076e-06, "loss": 0.4104, "step": 10642 }, { "epoch": 1.97, "learning_rate": 5.580099110071293e-06, "loss": 0.4205, "step": 10643 }, { "epoch": 1.97, "learning_rate": 5.578307443911377e-06, "loss": 0.4277, "step": 10644 }, { "epoch": 1.97, "learning_rate": 5.576515954168802e-06, "loss": 0.4512, "step": 10645 }, { "epoch": 1.97, "learning_rate": 5.574724640915057e-06, "loss": 0.4132, "step": 10646 }, { "epoch": 1.97, "learning_rate": 5.572933504221599e-06, "loss": 0.4342, "step": 10647 }, { "epoch": 1.97, "learning_rate": 5.571142544159903e-06, "loss": 0.432, "step": 10648 }, { "epoch": 1.97, "learning_rate": 5.569351760801416e-06, "loss": 0.4235, "step": 10649 }, { "epoch": 1.97, "learning_rate": 5.567561154217594e-06, "loss": 0.4154, "step": 10650 }, { "epoch": 1.97, "learning_rate": 5.565770724479871e-06, "loss": 0.4135, "step": 10651 }, { "epoch": 1.97, "learning_rate": 5.563980471659691e-06, "loss": 0.433, "step": 10652 }, { "epoch": 1.97, "learning_rate": 5.562190395828478e-06, "loss": 0.4305, "step": 10653 }, { "epoch": 1.97, "learning_rate": 5.560400497057645e-06, "loss": 0.4355, "step": 10654 }, { "epoch": 1.97, "learning_rate": 5.558610775418619e-06, "loss": 0.4481, "step": 10655 }, { "epoch": 1.97, "learning_rate": 5.556821230982796e-06, "loss": 0.4107, "step": 10656 }, { "epoch": 1.97, "learning_rate": 5.555031863821582e-06, "loss": 0.4145, "step": 10657 }, { "epoch": 1.97, "learning_rate": 5.553242674006368e-06, "loss": 0.4178, "step": 10658 }, { "epoch": 1.97, "learning_rate": 5.551453661608534e-06, "loss": 0.4298, "step": 10659 }, { "epoch": 1.97, "learning_rate": 5.549664826699468e-06, "loss": 0.4227, "step": 10660 }, { "epoch": 1.97, "learning_rate": 5.54787616935053e-06, "loss": 0.4373, "step": 10661 }, { "epoch": 1.97, "learning_rate": 5.546087689633095e-06, "loss": 0.4383, "step": 10662 }, { "epoch": 1.97, "learning_rate": 5.5442993876185145e-06, "loss": 0.4114, "step": 10663 }, { "epoch": 1.97, "learning_rate": 5.542511263378136e-06, "loss": 0.4505, "step": 10664 }, { "epoch": 1.97, "learning_rate": 5.5407233169833075e-06, "loss": 0.4174, "step": 10665 }, { "epoch": 1.97, "learning_rate": 5.5389355485053596e-06, "loss": 0.4161, "step": 10666 }, { "epoch": 1.97, "learning_rate": 5.537147958015627e-06, "loss": 0.4209, "step": 10667 }, { "epoch": 1.97, "learning_rate": 5.535360545585425e-06, "loss": 0.4118, "step": 10668 }, { "epoch": 1.97, "learning_rate": 5.533573311286075e-06, "loss": 0.416, "step": 10669 }, { "epoch": 1.97, "learning_rate": 5.53178625518888e-06, "loss": 0.428, "step": 10670 }, { "epoch": 1.97, "learning_rate": 5.529999377365138e-06, "loss": 0.4392, "step": 10671 }, { "epoch": 1.97, "learning_rate": 5.528212677886148e-06, "loss": 0.4182, "step": 10672 }, { "epoch": 1.97, "learning_rate": 5.526426156823188e-06, "loss": 0.4238, "step": 10673 }, { "epoch": 1.97, "learning_rate": 5.524639814247547e-06, "loss": 0.4133, "step": 10674 }, { "epoch": 1.98, "learning_rate": 5.5228536502304915e-06, "loss": 0.42, "step": 10675 }, { "epoch": 1.98, "learning_rate": 5.521067664843282e-06, "loss": 0.4116, "step": 10676 }, { "epoch": 1.98, "learning_rate": 5.519281858157184e-06, "loss": 0.4046, "step": 10677 }, { "epoch": 1.98, "learning_rate": 5.51749623024344e-06, "loss": 0.4222, "step": 10678 }, { "epoch": 1.98, "learning_rate": 5.515710781173302e-06, "loss": 0.4089, "step": 10679 }, { "epoch": 1.98, "learning_rate": 5.513925511018e-06, "loss": 0.4065, "step": 10680 }, { "epoch": 1.98, "learning_rate": 5.512140419848761e-06, "loss": 0.4281, "step": 10681 }, { "epoch": 1.98, "learning_rate": 5.510355507736814e-06, "loss": 0.4093, "step": 10682 }, { "epoch": 1.98, "learning_rate": 5.508570774753366e-06, "loss": 0.4376, "step": 10683 }, { "epoch": 1.98, "learning_rate": 5.506786220969633e-06, "loss": 0.4158, "step": 10684 }, { "epoch": 1.98, "learning_rate": 5.50500184645681e-06, "loss": 0.4362, "step": 10685 }, { "epoch": 1.98, "learning_rate": 5.503217651286088e-06, "loss": 0.4189, "step": 10686 }, { "epoch": 1.98, "learning_rate": 5.501433635528659e-06, "loss": 0.4127, "step": 10687 }, { "epoch": 1.98, "learning_rate": 5.499649799255695e-06, "loss": 0.4067, "step": 10688 }, { "epoch": 1.98, "learning_rate": 5.497866142538377e-06, "loss": 0.4266, "step": 10689 }, { "epoch": 1.98, "learning_rate": 5.496082665447859e-06, "loss": 0.4314, "step": 10690 }, { "epoch": 1.98, "learning_rate": 5.494299368055309e-06, "loss": 0.4373, "step": 10691 }, { "epoch": 1.98, "learning_rate": 5.492516250431869e-06, "loss": 0.436, "step": 10692 }, { "epoch": 1.98, "learning_rate": 5.490733312648689e-06, "loss": 0.4166, "step": 10693 }, { "epoch": 1.98, "learning_rate": 5.488950554776895e-06, "loss": 0.4219, "step": 10694 }, { "epoch": 1.98, "learning_rate": 5.4871679768876275e-06, "loss": 0.4212, "step": 10695 }, { "epoch": 1.98, "learning_rate": 5.485385579051998e-06, "loss": 0.4352, "step": 10696 }, { "epoch": 1.98, "learning_rate": 5.48360336134113e-06, "loss": 0.4106, "step": 10697 }, { "epoch": 1.98, "learning_rate": 5.481821323826121e-06, "loss": 0.432, "step": 10698 }, { "epoch": 1.98, "learning_rate": 5.4800394665780795e-06, "loss": 0.4015, "step": 10699 }, { "epoch": 1.98, "learning_rate": 5.478257789668092e-06, "loss": 0.418, "step": 10700 }, { "epoch": 1.98, "learning_rate": 5.476476293167251e-06, "loss": 0.4423, "step": 10701 }, { "epoch": 1.98, "learning_rate": 5.474694977146631e-06, "loss": 0.4132, "step": 10702 }, { "epoch": 1.98, "learning_rate": 5.472913841677297e-06, "loss": 0.4146, "step": 10703 }, { "epoch": 1.98, "learning_rate": 5.4711328868303245e-06, "loss": 0.4083, "step": 10704 }, { "epoch": 1.98, "learning_rate": 5.469352112676761e-06, "loss": 0.4361, "step": 10705 }, { "epoch": 1.98, "learning_rate": 5.467571519287665e-06, "loss": 0.4218, "step": 10706 }, { "epoch": 1.98, "learning_rate": 5.465791106734072e-06, "loss": 0.4176, "step": 10707 }, { "epoch": 1.98, "learning_rate": 5.464010875087016e-06, "loss": 0.4056, "step": 10708 }, { "epoch": 1.98, "learning_rate": 5.462230824417531e-06, "loss": 0.4415, "step": 10709 }, { "epoch": 1.98, "learning_rate": 5.460450954796631e-06, "loss": 0.4323, "step": 10710 }, { "epoch": 1.98, "learning_rate": 5.458671266295336e-06, "loss": 0.4362, "step": 10711 }, { "epoch": 1.98, "learning_rate": 5.456891758984648e-06, "loss": 0.4177, "step": 10712 }, { "epoch": 1.98, "learning_rate": 5.45511243293557e-06, "loss": 0.4132, "step": 10713 }, { "epoch": 1.98, "learning_rate": 5.453333288219091e-06, "loss": 0.4216, "step": 10714 }, { "epoch": 1.98, "learning_rate": 5.4515543249061935e-06, "loss": 0.4166, "step": 10715 }, { "epoch": 1.98, "learning_rate": 5.449775543067859e-06, "loss": 0.4217, "step": 10716 }, { "epoch": 1.98, "learning_rate": 5.447996942775053e-06, "loss": 0.4237, "step": 10717 }, { "epoch": 1.98, "learning_rate": 5.446218524098745e-06, "loss": 0.4351, "step": 10718 }, { "epoch": 1.98, "learning_rate": 5.4444402871098865e-06, "loss": 0.4118, "step": 10719 }, { "epoch": 1.98, "learning_rate": 5.442662231879423e-06, "loss": 0.4244, "step": 10720 }, { "epoch": 1.98, "learning_rate": 5.440884358478302e-06, "loss": 0.3975, "step": 10721 }, { "epoch": 1.98, "learning_rate": 5.439106666977451e-06, "loss": 0.4246, "step": 10722 }, { "epoch": 1.98, "learning_rate": 5.437329157447803e-06, "loss": 0.4201, "step": 10723 }, { "epoch": 1.98, "learning_rate": 5.435551829960274e-06, "loss": 0.4227, "step": 10724 }, { "epoch": 1.98, "learning_rate": 5.433774684585772e-06, "loss": 0.4335, "step": 10725 }, { "epoch": 1.98, "learning_rate": 5.43199772139521e-06, "loss": 0.4239, "step": 10726 }, { "epoch": 1.98, "learning_rate": 5.430220940459478e-06, "loss": 0.4099, "step": 10727 }, { "epoch": 1.98, "learning_rate": 5.4284443418494735e-06, "loss": 0.4565, "step": 10728 }, { "epoch": 1.99, "learning_rate": 5.426667925636076e-06, "loss": 0.4391, "step": 10729 }, { "epoch": 1.99, "learning_rate": 5.424891691890156e-06, "loss": 0.4171, "step": 10730 }, { "epoch": 1.99, "learning_rate": 5.423115640682592e-06, "loss": 0.4147, "step": 10731 }, { "epoch": 1.99, "learning_rate": 5.421339772084236e-06, "loss": 0.4247, "step": 10732 }, { "epoch": 1.99, "learning_rate": 5.419564086165949e-06, "loss": 0.4175, "step": 10733 }, { "epoch": 1.99, "learning_rate": 5.417788582998571e-06, "loss": 0.4406, "step": 10734 }, { "epoch": 1.99, "learning_rate": 5.416013262652949e-06, "loss": 0.4205, "step": 10735 }, { "epoch": 1.99, "learning_rate": 5.414238125199911e-06, "loss": 0.4239, "step": 10736 }, { "epoch": 1.99, "learning_rate": 5.412463170710277e-06, "loss": 0.4257, "step": 10737 }, { "epoch": 1.99, "learning_rate": 5.410688399254873e-06, "loss": 0.441, "step": 10738 }, { "epoch": 1.99, "learning_rate": 5.4089138109045015e-06, "loss": 0.4117, "step": 10739 }, { "epoch": 1.99, "learning_rate": 5.407139405729972e-06, "loss": 0.4146, "step": 10740 }, { "epoch": 1.99, "learning_rate": 5.405365183802077e-06, "loss": 0.4456, "step": 10741 }, { "epoch": 1.99, "learning_rate": 5.4035911451916e-06, "loss": 0.4274, "step": 10742 }, { "epoch": 1.99, "learning_rate": 5.401817289969331e-06, "loss": 0.4448, "step": 10743 }, { "epoch": 1.99, "learning_rate": 5.400043618206034e-06, "loss": 0.4183, "step": 10744 }, { "epoch": 1.99, "learning_rate": 5.398270129972485e-06, "loss": 0.4211, "step": 10745 }, { "epoch": 1.99, "learning_rate": 5.396496825339435e-06, "loss": 0.4322, "step": 10746 }, { "epoch": 1.99, "learning_rate": 5.39472370437764e-06, "loss": 0.4098, "step": 10747 }, { "epoch": 1.99, "learning_rate": 5.392950767157841e-06, "loss": 0.4246, "step": 10748 }, { "epoch": 1.99, "learning_rate": 5.3911780137507786e-06, "loss": 0.432, "step": 10749 }, { "epoch": 1.99, "learning_rate": 5.389405444227177e-06, "loss": 0.4224, "step": 10750 }, { "epoch": 1.99, "learning_rate": 5.387633058657766e-06, "loss": 0.4055, "step": 10751 }, { "epoch": 1.99, "learning_rate": 5.385860857113253e-06, "loss": 0.4396, "step": 10752 }, { "epoch": 1.99, "learning_rate": 5.384088839664352e-06, "loss": 0.4176, "step": 10753 }, { "epoch": 1.99, "learning_rate": 5.382317006381758e-06, "loss": 0.4589, "step": 10754 }, { "epoch": 1.99, "learning_rate": 5.380545357336168e-06, "loss": 0.4329, "step": 10755 }, { "epoch": 1.99, "learning_rate": 5.3787738925982626e-06, "loss": 0.4213, "step": 10756 }, { "epoch": 1.99, "learning_rate": 5.377002612238726e-06, "loss": 0.418, "step": 10757 }, { "epoch": 1.99, "learning_rate": 5.375231516328228e-06, "loss": 0.4052, "step": 10758 }, { "epoch": 1.99, "learning_rate": 5.373460604937424e-06, "loss": 0.4248, "step": 10759 }, { "epoch": 1.99, "learning_rate": 5.371689878136981e-06, "loss": 0.4173, "step": 10760 }, { "epoch": 1.99, "learning_rate": 5.3699193359975375e-06, "loss": 0.4209, "step": 10761 }, { "epoch": 1.99, "learning_rate": 5.368148978589745e-06, "loss": 0.4268, "step": 10762 }, { "epoch": 1.99, "learning_rate": 5.366378805984233e-06, "loss": 0.4136, "step": 10763 }, { "epoch": 1.99, "learning_rate": 5.364608818251623e-06, "loss": 0.4156, "step": 10764 }, { "epoch": 1.99, "learning_rate": 5.362839015462543e-06, "loss": 0.4157, "step": 10765 }, { "epoch": 1.99, "learning_rate": 5.361069397687597e-06, "loss": 0.4186, "step": 10766 }, { "epoch": 1.99, "learning_rate": 5.359299964997397e-06, "loss": 0.4192, "step": 10767 }, { "epoch": 1.99, "learning_rate": 5.357530717462538e-06, "loss": 0.4342, "step": 10768 }, { "epoch": 1.99, "learning_rate": 5.355761655153602e-06, "loss": 0.4142, "step": 10769 }, { "epoch": 1.99, "learning_rate": 5.353992778141182e-06, "loss": 0.4278, "step": 10770 }, { "epoch": 1.99, "learning_rate": 5.352224086495845e-06, "loss": 0.4187, "step": 10771 }, { "epoch": 1.99, "learning_rate": 5.350455580288165e-06, "loss": 0.4103, "step": 10772 }, { "epoch": 1.99, "learning_rate": 5.3486872595886995e-06, "loss": 0.4104, "step": 10773 }, { "epoch": 1.99, "learning_rate": 5.346919124467997e-06, "loss": 0.4273, "step": 10774 }, { "epoch": 1.99, "learning_rate": 5.34515117499661e-06, "loss": 0.4158, "step": 10775 }, { "epoch": 1.99, "learning_rate": 5.343383411245069e-06, "loss": 0.4254, "step": 10776 }, { "epoch": 1.99, "learning_rate": 5.341615833283911e-06, "loss": 0.4137, "step": 10777 }, { "epoch": 1.99, "learning_rate": 5.3398484411836545e-06, "loss": 0.4335, "step": 10778 }, { "epoch": 1.99, "learning_rate": 5.33808123501482e-06, "loss": 0.4222, "step": 10779 }, { "epoch": 1.99, "learning_rate": 5.336314214847913e-06, "loss": 0.4219, "step": 10780 }, { "epoch": 1.99, "learning_rate": 5.33454738075343e-06, "loss": 0.4179, "step": 10781 }, { "epoch": 1.99, "learning_rate": 5.332780732801874e-06, "loss": 0.4229, "step": 10782 }, { "epoch": 2.0, "learning_rate": 5.331014271063721e-06, "loss": 0.4245, "step": 10783 }, { "epoch": 2.0, "learning_rate": 5.329247995609457e-06, "loss": 0.4071, "step": 10784 }, { "epoch": 2.0, "learning_rate": 5.327481906509552e-06, "loss": 0.4243, "step": 10785 }, { "epoch": 2.0, "learning_rate": 5.325716003834462e-06, "loss": 0.4187, "step": 10786 }, { "epoch": 2.0, "learning_rate": 5.323950287654656e-06, "loss": 0.4147, "step": 10787 }, { "epoch": 2.0, "learning_rate": 5.322184758040569e-06, "loss": 0.4167, "step": 10788 }, { "epoch": 2.0, "learning_rate": 5.3204194150626564e-06, "loss": 0.4258, "step": 10789 }, { "epoch": 2.0, "learning_rate": 5.3186542587913425e-06, "loss": 0.4223, "step": 10790 }, { "epoch": 2.0, "learning_rate": 5.316889289297054e-06, "loss": 0.4211, "step": 10791 }, { "epoch": 2.0, "learning_rate": 5.315124506650215e-06, "loss": 0.4527, "step": 10792 }, { "epoch": 2.0, "learning_rate": 5.313359910921232e-06, "loss": 0.4074, "step": 10793 }, { "epoch": 2.0, "learning_rate": 5.3115955021805155e-06, "loss": 0.4324, "step": 10794 }, { "epoch": 2.0, "learning_rate": 5.309831280498453e-06, "loss": 0.4053, "step": 10795 }, { "epoch": 2.0, "learning_rate": 5.308067245945443e-06, "loss": 0.4117, "step": 10796 }, { "epoch": 2.0, "learning_rate": 5.3063033985918585e-06, "loss": 0.4489, "step": 10797 }, { "epoch": 2.0, "learning_rate": 5.304539738508083e-06, "loss": 0.4191, "step": 10798 }, { "epoch": 2.0, "learning_rate": 5.302776265764475e-06, "loss": 0.4267, "step": 10799 }, { "epoch": 2.0, "learning_rate": 5.301012980431401e-06, "loss": 0.4406, "step": 10800 }, { "epoch": 2.0, "learning_rate": 5.299249882579205e-06, "loss": 0.4122, "step": 10801 }, { "epoch": 2.0, "learning_rate": 5.297486972278239e-06, "loss": 0.4312, "step": 10802 }, { "epoch": 2.0, "learning_rate": 5.295724249598833e-06, "loss": 0.4401, "step": 10803 }, { "epoch": 2.0, "learning_rate": 5.2939617146113235e-06, "loss": 0.4464, "step": 10804 }, { "epoch": 2.0, "learning_rate": 5.292199367386024e-06, "loss": 0.417, "step": 10805 }, { "epoch": 2.0, "learning_rate": 5.290437207993257e-06, "loss": 0.4186, "step": 10806 }, { "epoch": 2.0, "learning_rate": 5.2886752365033275e-06, "loss": 0.4265, "step": 10807 }, { "epoch": 2.0, "learning_rate": 5.2869134529865285e-06, "loss": 0.4051, "step": 10808 }, { "epoch": 2.0, "learning_rate": 5.285151857513161e-06, "loss": 0.42, "step": 10809 }, { "epoch": 2.0, "learning_rate": 5.2833904501535e-06, "loss": 0.4191, "step": 10810 }, { "epoch": 2.0, "learning_rate": 5.281629230977834e-06, "loss": 0.4255, "step": 10811 }, { "epoch": 2.0, "learning_rate": 5.279868200056424e-06, "loss": 0.4189, "step": 10812 }, { "epoch": 2.0, "learning_rate": 5.27810735745953e-06, "loss": 0.4271, "step": 10813 }, { "epoch": 2.0, "learning_rate": 5.276346703257414e-06, "loss": 0.4161, "step": 10814 }, { "epoch": 2.0, "learning_rate": 5.274586237520314e-06, "loss": 0.3974, "step": 10815 }, { "epoch": 2.0, "learning_rate": 5.272825960318479e-06, "loss": 0.4244, "step": 10816 }, { "epoch": 2.0, "learning_rate": 5.271065871722136e-06, "loss": 0.4384, "step": 10817 }, { "epoch": 2.0, "learning_rate": 5.269305971801506e-06, "loss": 0.4244, "step": 10818 }, { "epoch": 2.0, "learning_rate": 5.2675462606268125e-06, "loss": 0.4014, "step": 10819 }, { "epoch": 2.0, "learning_rate": 5.265786738268258e-06, "loss": 0.4142, "step": 10820 }, { "epoch": 2.0, "learning_rate": 5.264027404796051e-06, "loss": 0.4265, "step": 10821 }, { "epoch": 2.0, "learning_rate": 5.262268260280377e-06, "loss": 0.4189, "step": 10822 }, { "epoch": 2.0, "learning_rate": 5.2605093047914334e-06, "loss": 0.4111, "step": 10823 }, { "epoch": 2.0, "learning_rate": 5.258750538399393e-06, "loss": 0.4159, "step": 10824 }, { "epoch": 2.0, "learning_rate": 5.256991961174425e-06, "loss": 0.4131, "step": 10825 }, { "epoch": 2.0, "learning_rate": 5.255233573186698e-06, "loss": 0.433, "step": 10826 }, { "epoch": 2.0, "learning_rate": 5.253475374506365e-06, "loss": 0.4065, "step": 10827 }, { "epoch": 2.0, "learning_rate": 5.251717365203579e-06, "loss": 0.4184, "step": 10828 }, { "epoch": 2.0, "learning_rate": 5.249959545348479e-06, "loss": 0.4302, "step": 10829 }, { "epoch": 2.0, "learning_rate": 5.2482019150111955e-06, "loss": 0.4331, "step": 10830 }, { "epoch": 2.0, "learning_rate": 5.2464444742618615e-06, "loss": 0.4252, "step": 10831 }, { "epoch": 2.0, "learning_rate": 5.244687223170588e-06, "loss": 0.4208, "step": 10832 }, { "epoch": 2.0, "learning_rate": 5.242930161807493e-06, "loss": 0.4057, "step": 10833 }, { "epoch": 2.0, "learning_rate": 5.241173290242679e-06, "loss": 0.4044, "step": 10834 }, { "epoch": 2.0, "learning_rate": 5.239416608546235e-06, "loss": 0.4194, "step": 10835 }, { "epoch": 2.0, "learning_rate": 5.237660116788259e-06, "loss": 0.4227, "step": 10836 }, { "epoch": 2.0, "learning_rate": 5.235903815038823e-06, "loss": 0.4026, "step": 10837 }, { "epoch": 2.01, "learning_rate": 5.2341477033680065e-06, "loss": 0.4119, "step": 10838 }, { "epoch": 2.01, "learning_rate": 5.232391781845875e-06, "loss": 0.3998, "step": 10839 }, { "epoch": 2.01, "learning_rate": 5.230636050542479e-06, "loss": 0.4402, "step": 10840 }, { "epoch": 2.01, "learning_rate": 5.22888050952788e-06, "loss": 0.4166, "step": 10841 }, { "epoch": 2.01, "learning_rate": 5.2271251588721105e-06, "loss": 0.4218, "step": 10842 }, { "epoch": 2.01, "learning_rate": 5.2253699986452136e-06, "loss": 0.43, "step": 10843 }, { "epoch": 2.01, "learning_rate": 5.223615028917211e-06, "loss": 0.4025, "step": 10844 }, { "epoch": 2.01, "learning_rate": 5.221860249758128e-06, "loss": 0.4116, "step": 10845 }, { "epoch": 2.01, "learning_rate": 5.220105661237971e-06, "loss": 0.4033, "step": 10846 }, { "epoch": 2.01, "learning_rate": 5.218351263426753e-06, "loss": 0.4133, "step": 10847 }, { "epoch": 2.01, "learning_rate": 5.216597056394462e-06, "loss": 0.4181, "step": 10848 }, { "epoch": 2.01, "learning_rate": 5.2148430402110974e-06, "loss": 0.4361, "step": 10849 }, { "epoch": 2.01, "learning_rate": 5.213089214946631e-06, "loss": 0.4219, "step": 10850 }, { "epoch": 2.01, "learning_rate": 5.211335580671046e-06, "loss": 0.4118, "step": 10851 }, { "epoch": 2.01, "learning_rate": 5.209582137454301e-06, "loss": 0.426, "step": 10852 }, { "epoch": 2.01, "learning_rate": 5.207828885366364e-06, "loss": 0.4183, "step": 10853 }, { "epoch": 2.01, "learning_rate": 5.206075824477179e-06, "loss": 0.4219, "step": 10854 }, { "epoch": 2.01, "learning_rate": 5.204322954856695e-06, "loss": 0.4155, "step": 10855 }, { "epoch": 2.01, "learning_rate": 5.2025702765748475e-06, "loss": 0.4091, "step": 10856 }, { "epoch": 2.01, "learning_rate": 5.2008177897015596e-06, "loss": 0.4076, "step": 10857 }, { "epoch": 2.01, "learning_rate": 5.199065494306761e-06, "loss": 0.4298, "step": 10858 }, { "epoch": 2.01, "learning_rate": 5.1973133904603555e-06, "loss": 0.4276, "step": 10859 }, { "epoch": 2.01, "learning_rate": 5.195561478232258e-06, "loss": 0.4159, "step": 10860 }, { "epoch": 2.01, "learning_rate": 5.193809757692363e-06, "loss": 0.4144, "step": 10861 }, { "epoch": 2.01, "learning_rate": 5.192058228910555e-06, "loss": 0.4337, "step": 10862 }, { "epoch": 2.01, "learning_rate": 5.190306891956727e-06, "loss": 0.414, "step": 10863 }, { "epoch": 2.01, "learning_rate": 5.188555746900745e-06, "loss": 0.4263, "step": 10864 }, { "epoch": 2.01, "learning_rate": 5.186804793812483e-06, "loss": 0.4219, "step": 10865 }, { "epoch": 2.01, "learning_rate": 5.185054032761796e-06, "loss": 0.4121, "step": 10866 }, { "epoch": 2.01, "learning_rate": 5.183303463818543e-06, "loss": 0.4051, "step": 10867 }, { "epoch": 2.01, "learning_rate": 5.181553087052562e-06, "loss": 0.4181, "step": 10868 }, { "epoch": 2.01, "learning_rate": 5.17980290253369e-06, "loss": 0.4141, "step": 10869 }, { "epoch": 2.01, "learning_rate": 5.17805291033176e-06, "loss": 0.4372, "step": 10870 }, { "epoch": 2.01, "learning_rate": 5.176303110516587e-06, "loss": 0.4105, "step": 10871 }, { "epoch": 2.01, "learning_rate": 5.174553503157995e-06, "loss": 0.4147, "step": 10872 }, { "epoch": 2.01, "learning_rate": 5.172804088325783e-06, "loss": 0.4044, "step": 10873 }, { "epoch": 2.01, "learning_rate": 5.171054866089746e-06, "loss": 0.4253, "step": 10874 }, { "epoch": 2.01, "learning_rate": 5.1693058365196846e-06, "loss": 0.4097, "step": 10875 }, { "epoch": 2.01, "learning_rate": 5.1675569996853715e-06, "loss": 0.4045, "step": 10876 }, { "epoch": 2.01, "learning_rate": 5.165808355656592e-06, "loss": 0.4402, "step": 10877 }, { "epoch": 2.01, "learning_rate": 5.164059904503107e-06, "loss": 0.4338, "step": 10878 }, { "epoch": 2.01, "learning_rate": 5.162311646294676e-06, "loss": 0.4276, "step": 10879 }, { "epoch": 2.01, "learning_rate": 5.160563581101057e-06, "loss": 0.4141, "step": 10880 }, { "epoch": 2.01, "learning_rate": 5.158815708991988e-06, "loss": 0.4371, "step": 10881 }, { "epoch": 2.01, "learning_rate": 5.1570680300372114e-06, "loss": 0.4016, "step": 10882 }, { "epoch": 2.01, "learning_rate": 5.155320544306454e-06, "loss": 0.4081, "step": 10883 }, { "epoch": 2.01, "learning_rate": 5.153573251869435e-06, "loss": 0.4321, "step": 10884 }, { "epoch": 2.01, "learning_rate": 5.151826152795873e-06, "loss": 0.4223, "step": 10885 }, { "epoch": 2.01, "learning_rate": 5.1500792471554685e-06, "loss": 0.4157, "step": 10886 }, { "epoch": 2.01, "learning_rate": 5.148332535017926e-06, "loss": 0.4255, "step": 10887 }, { "epoch": 2.01, "learning_rate": 5.146586016452928e-06, "loss": 0.4149, "step": 10888 }, { "epoch": 2.01, "learning_rate": 5.144839691530167e-06, "loss": 0.4162, "step": 10889 }, { "epoch": 2.01, "learning_rate": 5.143093560319312e-06, "loss": 0.421, "step": 10890 }, { "epoch": 2.01, "learning_rate": 5.14134762289003e-06, "loss": 0.4284, "step": 10891 }, { "epoch": 2.02, "learning_rate": 5.139601879311984e-06, "loss": 0.4141, "step": 10892 }, { "epoch": 2.02, "learning_rate": 5.13785632965482e-06, "loss": 0.4453, "step": 10893 }, { "epoch": 2.02, "learning_rate": 5.136110973988192e-06, "loss": 0.3984, "step": 10894 }, { "epoch": 2.02, "learning_rate": 5.134365812381726e-06, "loss": 0.4201, "step": 10895 }, { "epoch": 2.02, "learning_rate": 5.132620844905061e-06, "loss": 0.4144, "step": 10896 }, { "epoch": 2.02, "learning_rate": 5.130876071627807e-06, "loss": 0.4033, "step": 10897 }, { "epoch": 2.02, "learning_rate": 5.129131492619588e-06, "loss": 0.418, "step": 10898 }, { "epoch": 2.02, "learning_rate": 5.127387107949999e-06, "loss": 0.4198, "step": 10899 }, { "epoch": 2.02, "learning_rate": 5.1256429176886465e-06, "loss": 0.43, "step": 10900 }, { "epoch": 2.02, "learning_rate": 5.123898921905115e-06, "loss": 0.423, "step": 10901 }, { "epoch": 2.02, "learning_rate": 5.122155120668992e-06, "loss": 0.4202, "step": 10902 }, { "epoch": 2.02, "learning_rate": 5.120411514049843e-06, "loss": 0.4132, "step": 10903 }, { "epoch": 2.02, "learning_rate": 5.118668102117246e-06, "loss": 0.417, "step": 10904 }, { "epoch": 2.02, "learning_rate": 5.116924884940754e-06, "loss": 0.4492, "step": 10905 }, { "epoch": 2.02, "learning_rate": 5.115181862589914e-06, "loss": 0.4293, "step": 10906 }, { "epoch": 2.02, "learning_rate": 5.113439035134278e-06, "loss": 0.4432, "step": 10907 }, { "epoch": 2.02, "learning_rate": 5.111696402643373e-06, "loss": 0.425, "step": 10908 }, { "epoch": 2.02, "learning_rate": 5.109953965186734e-06, "loss": 0.4249, "step": 10909 }, { "epoch": 2.02, "learning_rate": 5.108211722833876e-06, "loss": 0.4031, "step": 10910 }, { "epoch": 2.02, "learning_rate": 5.106469675654316e-06, "loss": 0.4111, "step": 10911 }, { "epoch": 2.02, "learning_rate": 5.104727823717557e-06, "loss": 0.4094, "step": 10912 }, { "epoch": 2.02, "learning_rate": 5.102986167093089e-06, "loss": 0.4361, "step": 10913 }, { "epoch": 2.02, "learning_rate": 5.101244705850412e-06, "loss": 0.4339, "step": 10914 }, { "epoch": 2.02, "learning_rate": 5.099503440058997e-06, "loss": 0.4088, "step": 10915 }, { "epoch": 2.02, "learning_rate": 5.097762369788325e-06, "loss": 0.4155, "step": 10916 }, { "epoch": 2.02, "learning_rate": 5.096021495107859e-06, "loss": 0.4163, "step": 10917 }, { "epoch": 2.02, "learning_rate": 5.094280816087052e-06, "loss": 0.4327, "step": 10918 }, { "epoch": 2.02, "learning_rate": 5.092540332795359e-06, "loss": 0.4246, "step": 10919 }, { "epoch": 2.02, "learning_rate": 5.09080004530222e-06, "loss": 0.4212, "step": 10920 }, { "epoch": 2.02, "learning_rate": 5.089059953677073e-06, "loss": 0.4299, "step": 10921 }, { "epoch": 2.02, "learning_rate": 5.087320057989341e-06, "loss": 0.4393, "step": 10922 }, { "epoch": 2.02, "learning_rate": 5.08558035830844e-06, "loss": 0.4248, "step": 10923 }, { "epoch": 2.02, "learning_rate": 5.0838408547037875e-06, "loss": 0.4123, "step": 10924 }, { "epoch": 2.02, "learning_rate": 5.082101547244779e-06, "loss": 0.4379, "step": 10925 }, { "epoch": 2.02, "learning_rate": 5.080362436000817e-06, "loss": 0.4048, "step": 10926 }, { "epoch": 2.02, "learning_rate": 5.078623521041286e-06, "loss": 0.4052, "step": 10927 }, { "epoch": 2.02, "learning_rate": 5.07688480243556e-06, "loss": 0.4168, "step": 10928 }, { "epoch": 2.02, "learning_rate": 5.075146280253021e-06, "loss": 0.4072, "step": 10929 }, { "epoch": 2.02, "learning_rate": 5.073407954563021e-06, "loss": 0.4316, "step": 10930 }, { "epoch": 2.02, "learning_rate": 5.071669825434929e-06, "loss": 0.4099, "step": 10931 }, { "epoch": 2.02, "learning_rate": 5.06993189293808e-06, "loss": 0.4178, "step": 10932 }, { "epoch": 2.02, "learning_rate": 5.068194157141826e-06, "loss": 0.4116, "step": 10933 }, { "epoch": 2.02, "learning_rate": 5.066456618115494e-06, "loss": 0.4092, "step": 10934 }, { "epoch": 2.02, "learning_rate": 5.0647192759284046e-06, "loss": 0.4235, "step": 10935 }, { "epoch": 2.02, "learning_rate": 5.0629821306498825e-06, "loss": 0.4084, "step": 10936 }, { "epoch": 2.02, "learning_rate": 5.061245182349228e-06, "loss": 0.4326, "step": 10937 }, { "epoch": 2.02, "learning_rate": 5.059508431095752e-06, "loss": 0.4183, "step": 10938 }, { "epoch": 2.02, "learning_rate": 5.0577718769587415e-06, "loss": 0.4245, "step": 10939 }, { "epoch": 2.02, "learning_rate": 5.056035520007481e-06, "loss": 0.418, "step": 10940 }, { "epoch": 2.02, "learning_rate": 5.054299360311252e-06, "loss": 0.4245, "step": 10941 }, { "epoch": 2.02, "learning_rate": 5.052563397939317e-06, "loss": 0.3985, "step": 10942 }, { "epoch": 2.02, "learning_rate": 5.050827632960948e-06, "loss": 0.4332, "step": 10943 }, { "epoch": 2.02, "learning_rate": 5.049092065445389e-06, "loss": 0.4244, "step": 10944 }, { "epoch": 2.02, "learning_rate": 5.047356695461893e-06, "loss": 0.4116, "step": 10945 }, { "epoch": 2.03, "learning_rate": 5.045621523079694e-06, "loss": 0.4122, "step": 10946 }, { "epoch": 2.03, "learning_rate": 5.043886548368026e-06, "loss": 0.4314, "step": 10947 }, { "epoch": 2.03, "learning_rate": 5.042151771396104e-06, "loss": 0.4308, "step": 10948 }, { "epoch": 2.03, "learning_rate": 5.0404171922331515e-06, "loss": 0.4089, "step": 10949 }, { "epoch": 2.03, "learning_rate": 5.038682810948367e-06, "loss": 0.4203, "step": 10950 }, { "epoch": 2.03, "learning_rate": 5.036948627610956e-06, "loss": 0.4123, "step": 10951 }, { "epoch": 2.03, "learning_rate": 5.035214642290103e-06, "loss": 0.4306, "step": 10952 }, { "epoch": 2.03, "learning_rate": 5.033480855054998e-06, "loss": 0.411, "step": 10953 }, { "epoch": 2.03, "learning_rate": 5.031747265974805e-06, "loss": 0.4218, "step": 10954 }, { "epoch": 2.03, "learning_rate": 5.030013875118705e-06, "loss": 0.4183, "step": 10955 }, { "epoch": 2.03, "learning_rate": 5.0282806825558465e-06, "loss": 0.4162, "step": 10956 }, { "epoch": 2.03, "learning_rate": 5.0265476883553806e-06, "loss": 0.4314, "step": 10957 }, { "epoch": 2.03, "learning_rate": 5.024814892586459e-06, "loss": 0.4248, "step": 10958 }, { "epoch": 2.03, "learning_rate": 5.0230822953182075e-06, "loss": 0.4055, "step": 10959 }, { "epoch": 2.03, "learning_rate": 5.021349896619762e-06, "loss": 0.423, "step": 10960 }, { "epoch": 2.03, "learning_rate": 5.019617696560239e-06, "loss": 0.4279, "step": 10961 }, { "epoch": 2.03, "learning_rate": 5.017885695208743e-06, "loss": 0.4144, "step": 10962 }, { "epoch": 2.03, "learning_rate": 5.016153892634387e-06, "loss": 0.4183, "step": 10963 }, { "epoch": 2.03, "learning_rate": 5.014422288906262e-06, "loss": 0.4231, "step": 10964 }, { "epoch": 2.03, "learning_rate": 5.012690884093461e-06, "loss": 0.4061, "step": 10965 }, { "epoch": 2.03, "learning_rate": 5.010959678265057e-06, "loss": 0.419, "step": 10966 }, { "epoch": 2.03, "learning_rate": 5.009228671490123e-06, "loss": 0.4142, "step": 10967 }, { "epoch": 2.03, "learning_rate": 5.0074978638377295e-06, "loss": 0.4215, "step": 10968 }, { "epoch": 2.03, "learning_rate": 5.005767255376922e-06, "loss": 0.4094, "step": 10969 }, { "epoch": 2.03, "learning_rate": 5.00403684617676e-06, "loss": 0.4117, "step": 10970 }, { "epoch": 2.03, "learning_rate": 5.002306636306278e-06, "loss": 0.423, "step": 10971 }, { "epoch": 2.03, "learning_rate": 5.000576625834503e-06, "loss": 0.411, "step": 10972 }, { "epoch": 2.03, "learning_rate": 4.998846814830469e-06, "loss": 0.4224, "step": 10973 }, { "epoch": 2.03, "learning_rate": 4.997117203363183e-06, "loss": 0.4309, "step": 10974 }, { "epoch": 2.03, "learning_rate": 4.995387791501664e-06, "loss": 0.4292, "step": 10975 }, { "epoch": 2.03, "learning_rate": 4.993658579314904e-06, "loss": 0.4496, "step": 10976 }, { "epoch": 2.03, "learning_rate": 4.9919295668718945e-06, "loss": 0.4405, "step": 10977 }, { "epoch": 2.03, "learning_rate": 4.990200754241627e-06, "loss": 0.4138, "step": 10978 }, { "epoch": 2.03, "learning_rate": 4.988472141493072e-06, "loss": 0.4483, "step": 10979 }, { "epoch": 2.03, "learning_rate": 4.986743728695202e-06, "loss": 0.4157, "step": 10980 }, { "epoch": 2.03, "learning_rate": 4.985015515916971e-06, "loss": 0.4055, "step": 10981 }, { "epoch": 2.03, "learning_rate": 4.9832875032273406e-06, "loss": 0.4318, "step": 10982 }, { "epoch": 2.03, "learning_rate": 4.981559690695251e-06, "loss": 0.4152, "step": 10983 }, { "epoch": 2.03, "learning_rate": 4.979832078389633e-06, "loss": 0.4355, "step": 10984 }, { "epoch": 2.03, "learning_rate": 4.978104666379426e-06, "loss": 0.4241, "step": 10985 }, { "epoch": 2.03, "learning_rate": 4.976377454733541e-06, "loss": 0.4292, "step": 10986 }, { "epoch": 2.03, "learning_rate": 4.974650443520899e-06, "loss": 0.4093, "step": 10987 }, { "epoch": 2.03, "learning_rate": 4.972923632810398e-06, "loss": 0.416, "step": 10988 }, { "epoch": 2.03, "learning_rate": 4.971197022670935e-06, "loss": 0.4267, "step": 10989 }, { "epoch": 2.03, "learning_rate": 4.969470613171402e-06, "loss": 0.4404, "step": 10990 }, { "epoch": 2.03, "learning_rate": 4.967744404380676e-06, "loss": 0.4343, "step": 10991 }, { "epoch": 2.03, "learning_rate": 4.966018396367633e-06, "loss": 0.4267, "step": 10992 }, { "epoch": 2.03, "learning_rate": 4.964292589201134e-06, "loss": 0.43, "step": 10993 }, { "epoch": 2.03, "learning_rate": 4.96256698295004e-06, "loss": 0.4215, "step": 10994 }, { "epoch": 2.03, "learning_rate": 4.9608415776831934e-06, "loss": 0.4007, "step": 10995 }, { "epoch": 2.03, "learning_rate": 4.959116373469441e-06, "loss": 0.4211, "step": 10996 }, { "epoch": 2.03, "learning_rate": 4.95739137037761e-06, "loss": 0.422, "step": 10997 }, { "epoch": 2.03, "learning_rate": 4.95566656847653e-06, "loss": 0.4306, "step": 10998 }, { "epoch": 2.03, "learning_rate": 4.953941967835011e-06, "loss": 0.4226, "step": 10999 }, { "epoch": 2.04, "learning_rate": 4.952217568521869e-06, "loss": 0.4272, "step": 11000 }, { "epoch": 2.04, "learning_rate": 4.950493370605895e-06, "loss": 0.433, "step": 11001 }, { "epoch": 2.04, "learning_rate": 4.948769374155893e-06, "loss": 0.4141, "step": 11002 }, { "epoch": 2.04, "learning_rate": 4.947045579240636e-06, "loss": 0.4195, "step": 11003 }, { "epoch": 2.04, "learning_rate": 4.945321985928908e-06, "loss": 0.4103, "step": 11004 }, { "epoch": 2.04, "learning_rate": 4.9435985942894745e-06, "loss": 0.4085, "step": 11005 }, { "epoch": 2.04, "learning_rate": 4.941875404391092e-06, "loss": 0.4181, "step": 11006 }, { "epoch": 2.04, "learning_rate": 4.94015241630252e-06, "loss": 0.3959, "step": 11007 }, { "epoch": 2.04, "learning_rate": 4.938429630092495e-06, "loss": 0.428, "step": 11008 }, { "epoch": 2.04, "learning_rate": 4.936707045829759e-06, "loss": 0.4045, "step": 11009 }, { "epoch": 2.04, "learning_rate": 4.934984663583039e-06, "loss": 0.41, "step": 11010 }, { "epoch": 2.04, "learning_rate": 4.9332624834210484e-06, "loss": 0.4215, "step": 11011 }, { "epoch": 2.04, "learning_rate": 4.9315405054125084e-06, "loss": 0.4282, "step": 11012 }, { "epoch": 2.04, "learning_rate": 4.929818729626114e-06, "loss": 0.3934, "step": 11013 }, { "epoch": 2.04, "learning_rate": 4.928097156130569e-06, "loss": 0.4058, "step": 11014 }, { "epoch": 2.04, "learning_rate": 4.926375784994558e-06, "loss": 0.4257, "step": 11015 }, { "epoch": 2.04, "learning_rate": 4.924654616286755e-06, "loss": 0.4253, "step": 11016 }, { "epoch": 2.04, "learning_rate": 4.92293365007584e-06, "loss": 0.4031, "step": 11017 }, { "epoch": 2.04, "learning_rate": 4.921212886430467e-06, "loss": 0.4271, "step": 11018 }, { "epoch": 2.04, "learning_rate": 4.9194923254193026e-06, "loss": 0.4261, "step": 11019 }, { "epoch": 2.04, "learning_rate": 4.917771967110988e-06, "loss": 0.4312, "step": 11020 }, { "epoch": 2.04, "learning_rate": 4.916051811574157e-06, "loss": 0.4272, "step": 11021 }, { "epoch": 2.04, "learning_rate": 4.9143318588774514e-06, "loss": 0.4307, "step": 11022 }, { "epoch": 2.04, "learning_rate": 4.912612109089485e-06, "loss": 0.4094, "step": 11023 }, { "epoch": 2.04, "learning_rate": 4.9108925622788794e-06, "loss": 0.395, "step": 11024 }, { "epoch": 2.04, "learning_rate": 4.909173218514235e-06, "loss": 0.42, "step": 11025 }, { "epoch": 2.04, "learning_rate": 4.907454077864157e-06, "loss": 0.4175, "step": 11026 }, { "epoch": 2.04, "learning_rate": 4.905735140397233e-06, "loss": 0.4233, "step": 11027 }, { "epoch": 2.04, "learning_rate": 4.904016406182041e-06, "loss": 0.4141, "step": 11028 }, { "epoch": 2.04, "learning_rate": 4.902297875287164e-06, "loss": 0.3914, "step": 11029 }, { "epoch": 2.04, "learning_rate": 4.900579547781159e-06, "loss": 0.4216, "step": 11030 }, { "epoch": 2.04, "learning_rate": 4.898861423732594e-06, "loss": 0.4302, "step": 11031 }, { "epoch": 2.04, "learning_rate": 4.8971435032100125e-06, "loss": 0.4344, "step": 11032 }, { "epoch": 2.04, "learning_rate": 4.8954257862819535e-06, "loss": 0.4146, "step": 11033 }, { "epoch": 2.04, "learning_rate": 4.893708273016959e-06, "loss": 0.4011, "step": 11034 }, { "epoch": 2.04, "learning_rate": 4.891990963483546e-06, "loss": 0.4291, "step": 11035 }, { "epoch": 2.04, "learning_rate": 4.890273857750241e-06, "loss": 0.4294, "step": 11036 }, { "epoch": 2.04, "learning_rate": 4.888556955885548e-06, "loss": 0.4126, "step": 11037 }, { "epoch": 2.04, "learning_rate": 4.886840257957966e-06, "loss": 0.4002, "step": 11038 }, { "epoch": 2.04, "learning_rate": 4.885123764035994e-06, "loss": 0.3942, "step": 11039 }, { "epoch": 2.04, "learning_rate": 4.88340747418811e-06, "loss": 0.4247, "step": 11040 }, { "epoch": 2.04, "learning_rate": 4.8816913884827985e-06, "loss": 0.4395, "step": 11041 }, { "epoch": 2.04, "learning_rate": 4.8799755069885245e-06, "loss": 0.4121, "step": 11042 }, { "epoch": 2.04, "learning_rate": 4.8782598297737445e-06, "loss": 0.4013, "step": 11043 }, { "epoch": 2.04, "learning_rate": 4.876544356906918e-06, "loss": 0.4257, "step": 11044 }, { "epoch": 2.04, "learning_rate": 4.874829088456483e-06, "loss": 0.4113, "step": 11045 }, { "epoch": 2.04, "learning_rate": 4.873114024490881e-06, "loss": 0.4379, "step": 11046 }, { "epoch": 2.04, "learning_rate": 4.871399165078534e-06, "loss": 0.4176, "step": 11047 }, { "epoch": 2.04, "learning_rate": 4.86968451028787e-06, "loss": 0.435, "step": 11048 }, { "epoch": 2.04, "learning_rate": 4.86797006018729e-06, "loss": 0.4156, "step": 11049 }, { "epoch": 2.04, "learning_rate": 4.866255814845208e-06, "loss": 0.422, "step": 11050 }, { "epoch": 2.04, "learning_rate": 4.864541774330008e-06, "loss": 0.4289, "step": 11051 }, { "epoch": 2.04, "learning_rate": 4.8628279387100895e-06, "loss": 0.4159, "step": 11052 }, { "epoch": 2.04, "learning_rate": 4.86111430805382e-06, "loss": 0.4215, "step": 11053 }, { "epoch": 2.05, "learning_rate": 4.859400882429579e-06, "loss": 0.4325, "step": 11054 }, { "epoch": 2.05, "learning_rate": 4.857687661905722e-06, "loss": 0.4067, "step": 11055 }, { "epoch": 2.05, "learning_rate": 4.85597464655061e-06, "loss": 0.4114, "step": 11056 }, { "epoch": 2.05, "learning_rate": 4.854261836432583e-06, "loss": 0.4347, "step": 11057 }, { "epoch": 2.05, "learning_rate": 4.852549231619983e-06, "loss": 0.4433, "step": 11058 }, { "epoch": 2.05, "learning_rate": 4.85083683218114e-06, "loss": 0.4184, "step": 11059 }, { "epoch": 2.05, "learning_rate": 4.849124638184369e-06, "loss": 0.4293, "step": 11060 }, { "epoch": 2.05, "learning_rate": 4.847412649697993e-06, "loss": 0.4191, "step": 11061 }, { "epoch": 2.05, "learning_rate": 4.845700866790309e-06, "loss": 0.4236, "step": 11062 }, { "epoch": 2.05, "learning_rate": 4.843989289529621e-06, "loss": 0.4078, "step": 11063 }, { "epoch": 2.05, "learning_rate": 4.842277917984215e-06, "loss": 0.4541, "step": 11064 }, { "epoch": 2.05, "learning_rate": 4.840566752222367e-06, "loss": 0.4158, "step": 11065 }, { "epoch": 2.05, "learning_rate": 4.838855792312356e-06, "loss": 0.4203, "step": 11066 }, { "epoch": 2.05, "learning_rate": 4.837145038322439e-06, "loss": 0.4056, "step": 11067 }, { "epoch": 2.05, "learning_rate": 4.835434490320881e-06, "loss": 0.4364, "step": 11068 }, { "epoch": 2.05, "learning_rate": 4.833724148375922e-06, "loss": 0.4153, "step": 11069 }, { "epoch": 2.05, "learning_rate": 4.832014012555805e-06, "loss": 0.407, "step": 11070 }, { "epoch": 2.05, "learning_rate": 4.830304082928764e-06, "loss": 0.4115, "step": 11071 }, { "epoch": 2.05, "learning_rate": 4.828594359563014e-06, "loss": 0.4185, "step": 11072 }, { "epoch": 2.05, "learning_rate": 4.826884842526777e-06, "loss": 0.4225, "step": 11073 }, { "epoch": 2.05, "learning_rate": 4.825175531888254e-06, "loss": 0.4269, "step": 11074 }, { "epoch": 2.05, "learning_rate": 4.8234664277156504e-06, "loss": 0.4143, "step": 11075 }, { "epoch": 2.05, "learning_rate": 4.821757530077151e-06, "loss": 0.4242, "step": 11076 }, { "epoch": 2.05, "learning_rate": 4.820048839040937e-06, "loss": 0.4042, "step": 11077 }, { "epoch": 2.05, "learning_rate": 4.818340354675186e-06, "loss": 0.4063, "step": 11078 }, { "epoch": 2.05, "learning_rate": 4.816632077048059e-06, "loss": 0.4106, "step": 11079 }, { "epoch": 2.05, "learning_rate": 4.814924006227718e-06, "loss": 0.4079, "step": 11080 }, { "epoch": 2.05, "learning_rate": 4.8132161422823096e-06, "loss": 0.43, "step": 11081 }, { "epoch": 2.05, "learning_rate": 4.811508485279971e-06, "loss": 0.4143, "step": 11082 }, { "epoch": 2.05, "learning_rate": 4.8098010352888405e-06, "loss": 0.4197, "step": 11083 }, { "epoch": 2.05, "learning_rate": 4.808093792377036e-06, "loss": 0.4145, "step": 11084 }, { "epoch": 2.05, "learning_rate": 4.80638675661268e-06, "loss": 0.3837, "step": 11085 }, { "epoch": 2.05, "learning_rate": 4.804679928063876e-06, "loss": 0.3657, "step": 11086 }, { "epoch": 2.05, "learning_rate": 4.8029733067987215e-06, "loss": 0.4331, "step": 11087 }, { "epoch": 2.05, "learning_rate": 4.801266892885314e-06, "loss": 0.4239, "step": 11088 }, { "epoch": 2.05, "learning_rate": 4.799560686391727e-06, "loss": 0.4182, "step": 11089 }, { "epoch": 2.05, "learning_rate": 4.7978546873860445e-06, "loss": 0.4269, "step": 11090 }, { "epoch": 2.05, "learning_rate": 4.796148895936325e-06, "loss": 0.4129, "step": 11091 }, { "epoch": 2.05, "learning_rate": 4.794443312110634e-06, "loss": 0.419, "step": 11092 }, { "epoch": 2.05, "learning_rate": 4.792737935977017e-06, "loss": 0.4066, "step": 11093 }, { "epoch": 2.05, "learning_rate": 4.7910327676035105e-06, "loss": 0.4384, "step": 11094 }, { "epoch": 2.05, "learning_rate": 4.789327807058157e-06, "loss": 0.4227, "step": 11095 }, { "epoch": 2.05, "learning_rate": 4.787623054408973e-06, "loss": 0.4343, "step": 11096 }, { "epoch": 2.05, "learning_rate": 4.785918509723982e-06, "loss": 0.4316, "step": 11097 }, { "epoch": 2.05, "learning_rate": 4.784214173071186e-06, "loss": 0.4137, "step": 11098 }, { "epoch": 2.05, "learning_rate": 4.782510044518592e-06, "loss": 0.432, "step": 11099 }, { "epoch": 2.05, "learning_rate": 4.780806124134181e-06, "loss": 0.421, "step": 11100 }, { "epoch": 2.05, "learning_rate": 4.779102411985947e-06, "loss": 0.4302, "step": 11101 }, { "epoch": 2.05, "learning_rate": 4.777398908141858e-06, "loss": 0.4222, "step": 11102 }, { "epoch": 2.05, "learning_rate": 4.7756956126698875e-06, "loss": 0.4357, "step": 11103 }, { "epoch": 2.05, "learning_rate": 4.773992525637984e-06, "loss": 0.4373, "step": 11104 }, { "epoch": 2.05, "learning_rate": 4.7722896471141075e-06, "loss": 0.4104, "step": 11105 }, { "epoch": 2.05, "learning_rate": 4.7705869771661915e-06, "loss": 0.4173, "step": 11106 }, { "epoch": 2.05, "learning_rate": 4.768884515862176e-06, "loss": 0.4182, "step": 11107 }, { "epoch": 2.06, "learning_rate": 4.7671822632699846e-06, "loss": 0.4209, "step": 11108 }, { "epoch": 2.06, "learning_rate": 4.765480219457529e-06, "loss": 0.4129, "step": 11109 }, { "epoch": 2.06, "learning_rate": 4.7637783844927245e-06, "loss": 0.4289, "step": 11110 }, { "epoch": 2.06, "learning_rate": 4.7620767584434635e-06, "loss": 0.4124, "step": 11111 }, { "epoch": 2.06, "learning_rate": 4.760375341377646e-06, "loss": 0.4045, "step": 11112 }, { "epoch": 2.06, "learning_rate": 4.758674133363148e-06, "loss": 0.4341, "step": 11113 }, { "epoch": 2.06, "learning_rate": 4.7569731344678516e-06, "loss": 0.4375, "step": 11114 }, { "epoch": 2.06, "learning_rate": 4.75527234475962e-06, "loss": 0.4213, "step": 11115 }, { "epoch": 2.06, "learning_rate": 4.753571764306308e-06, "loss": 0.4291, "step": 11116 }, { "epoch": 2.06, "learning_rate": 4.751871393175772e-06, "loss": 0.4273, "step": 11117 }, { "epoch": 2.06, "learning_rate": 4.750171231435847e-06, "loss": 0.4057, "step": 11118 }, { "epoch": 2.06, "learning_rate": 4.748471279154375e-06, "loss": 0.429, "step": 11119 }, { "epoch": 2.06, "learning_rate": 4.746771536399175e-06, "loss": 0.4419, "step": 11120 }, { "epoch": 2.06, "learning_rate": 4.745072003238062e-06, "loss": 0.4226, "step": 11121 }, { "epoch": 2.06, "learning_rate": 4.743372679738849e-06, "loss": 0.4297, "step": 11122 }, { "epoch": 2.06, "learning_rate": 4.741673565969331e-06, "loss": 0.4353, "step": 11123 }, { "epoch": 2.06, "learning_rate": 4.739974661997305e-06, "loss": 0.423, "step": 11124 }, { "epoch": 2.06, "learning_rate": 4.738275967890553e-06, "loss": 0.4327, "step": 11125 }, { "epoch": 2.06, "learning_rate": 4.736577483716843e-06, "loss": 0.4299, "step": 11126 }, { "epoch": 2.06, "learning_rate": 4.73487920954395e-06, "loss": 0.4422, "step": 11127 }, { "epoch": 2.06, "learning_rate": 4.733181145439626e-06, "loss": 0.4272, "step": 11128 }, { "epoch": 2.06, "learning_rate": 4.731483291471625e-06, "loss": 0.4084, "step": 11129 }, { "epoch": 2.06, "learning_rate": 4.729785647707688e-06, "loss": 0.4166, "step": 11130 }, { "epoch": 2.06, "learning_rate": 4.728088214215541e-06, "loss": 0.4386, "step": 11131 }, { "epoch": 2.06, "learning_rate": 4.726390991062918e-06, "loss": 0.4199, "step": 11132 }, { "epoch": 2.06, "learning_rate": 4.724693978317527e-06, "loss": 0.4323, "step": 11133 }, { "epoch": 2.06, "learning_rate": 4.722997176047083e-06, "loss": 0.4251, "step": 11134 }, { "epoch": 2.06, "learning_rate": 4.7213005843192785e-06, "loss": 0.4156, "step": 11135 }, { "epoch": 2.06, "learning_rate": 4.71960420320181e-06, "loss": 0.4308, "step": 11136 }, { "epoch": 2.06, "learning_rate": 4.717908032762357e-06, "loss": 0.4313, "step": 11137 }, { "epoch": 2.06, "learning_rate": 4.716212073068591e-06, "loss": 0.4229, "step": 11138 }, { "epoch": 2.06, "learning_rate": 4.714516324188184e-06, "loss": 0.4041, "step": 11139 }, { "epoch": 2.06, "learning_rate": 4.712820786188787e-06, "loss": 0.4224, "step": 11140 }, { "epoch": 2.06, "learning_rate": 4.711125459138055e-06, "loss": 0.428, "step": 11141 }, { "epoch": 2.06, "learning_rate": 4.709430343103625e-06, "loss": 0.403, "step": 11142 }, { "epoch": 2.06, "learning_rate": 4.707735438153125e-06, "loss": 0.4084, "step": 11143 }, { "epoch": 2.06, "learning_rate": 4.706040744354187e-06, "loss": 0.4269, "step": 11144 }, { "epoch": 2.06, "learning_rate": 4.704346261774418e-06, "loss": 0.4176, "step": 11145 }, { "epoch": 2.06, "learning_rate": 4.702651990481432e-06, "loss": 0.4192, "step": 11146 }, { "epoch": 2.06, "learning_rate": 4.70095793054282e-06, "loss": 0.4292, "step": 11147 }, { "epoch": 2.06, "learning_rate": 4.699264082026179e-06, "loss": 0.403, "step": 11148 }, { "epoch": 2.06, "learning_rate": 4.6975704449990835e-06, "loss": 0.4122, "step": 11149 }, { "epoch": 2.06, "learning_rate": 4.695877019529115e-06, "loss": 0.4338, "step": 11150 }, { "epoch": 2.06, "learning_rate": 4.694183805683827e-06, "loss": 0.42, "step": 11151 }, { "epoch": 2.06, "learning_rate": 4.692490803530788e-06, "loss": 0.4288, "step": 11152 }, { "epoch": 2.06, "learning_rate": 4.690798013137534e-06, "loss": 0.4401, "step": 11153 }, { "epoch": 2.06, "learning_rate": 4.689105434571614e-06, "loss": 0.4318, "step": 11154 }, { "epoch": 2.06, "learning_rate": 4.6874130679005505e-06, "loss": 0.4118, "step": 11155 }, { "epoch": 2.06, "learning_rate": 4.685720913191872e-06, "loss": 0.4125, "step": 11156 }, { "epoch": 2.06, "learning_rate": 4.684028970513088e-06, "loss": 0.4071, "step": 11157 }, { "epoch": 2.06, "learning_rate": 4.682337239931709e-06, "loss": 0.4303, "step": 11158 }, { "epoch": 2.06, "learning_rate": 4.680645721515229e-06, "loss": 0.4362, "step": 11159 }, { "epoch": 2.06, "learning_rate": 4.678954415331131e-06, "loss": 0.412, "step": 11160 }, { "epoch": 2.06, "learning_rate": 4.677263321446905e-06, "loss": 0.4144, "step": 11161 }, { "epoch": 2.07, "learning_rate": 4.675572439930015e-06, "loss": 0.4137, "step": 11162 }, { "epoch": 2.07, "learning_rate": 4.673881770847929e-06, "loss": 0.4278, "step": 11163 }, { "epoch": 2.07, "learning_rate": 4.6721913142681e-06, "loss": 0.415, "step": 11164 }, { "epoch": 2.07, "learning_rate": 4.670501070257969e-06, "loss": 0.4264, "step": 11165 }, { "epoch": 2.07, "learning_rate": 4.668811038884983e-06, "loss": 0.4217, "step": 11166 }, { "epoch": 2.07, "learning_rate": 4.66712122021656e-06, "loss": 0.4156, "step": 11167 }, { "epoch": 2.07, "learning_rate": 4.665431614320133e-06, "loss": 0.4163, "step": 11168 }, { "epoch": 2.07, "learning_rate": 4.663742221263107e-06, "loss": 0.424, "step": 11169 }, { "epoch": 2.07, "learning_rate": 4.662053041112882e-06, "loss": 0.4063, "step": 11170 }, { "epoch": 2.07, "learning_rate": 4.660364073936862e-06, "loss": 0.4117, "step": 11171 }, { "epoch": 2.07, "learning_rate": 4.658675319802427e-06, "loss": 0.4344, "step": 11172 }, { "epoch": 2.07, "learning_rate": 4.656986778776959e-06, "loss": 0.414, "step": 11173 }, { "epoch": 2.07, "learning_rate": 4.655298450927827e-06, "loss": 0.4262, "step": 11174 }, { "epoch": 2.07, "learning_rate": 4.653610336322388e-06, "loss": 0.4174, "step": 11175 }, { "epoch": 2.07, "learning_rate": 4.6519224350280025e-06, "loss": 0.4245, "step": 11176 }, { "epoch": 2.07, "learning_rate": 4.650234747112006e-06, "loss": 0.3992, "step": 11177 }, { "epoch": 2.07, "learning_rate": 4.648547272641741e-06, "loss": 0.409, "step": 11178 }, { "epoch": 2.07, "learning_rate": 4.646860011684528e-06, "loss": 0.4094, "step": 11179 }, { "epoch": 2.07, "learning_rate": 4.645172964307695e-06, "loss": 0.3949, "step": 11180 }, { "epoch": 2.07, "learning_rate": 4.643486130578545e-06, "loss": 0.4192, "step": 11181 }, { "epoch": 2.07, "learning_rate": 4.6417995105643775e-06, "loss": 0.4376, "step": 11182 }, { "epoch": 2.07, "learning_rate": 4.640113104332493e-06, "loss": 0.4179, "step": 11183 }, { "epoch": 2.07, "learning_rate": 4.638426911950169e-06, "loss": 0.4137, "step": 11184 }, { "epoch": 2.07, "learning_rate": 4.636740933484687e-06, "loss": 0.4381, "step": 11185 }, { "epoch": 2.07, "learning_rate": 4.635055169003313e-06, "loss": 0.4359, "step": 11186 }, { "epoch": 2.07, "learning_rate": 4.6333696185733e-06, "loss": 0.4137, "step": 11187 }, { "epoch": 2.07, "learning_rate": 4.631684282261908e-06, "loss": 0.4009, "step": 11188 }, { "epoch": 2.07, "learning_rate": 4.629999160136371e-06, "loss": 0.4057, "step": 11189 }, { "epoch": 2.07, "learning_rate": 4.628314252263927e-06, "loss": 0.4001, "step": 11190 }, { "epoch": 2.07, "learning_rate": 4.6266295587118e-06, "loss": 0.4346, "step": 11191 }, { "epoch": 2.07, "learning_rate": 4.6249450795472e-06, "loss": 0.4084, "step": 11192 }, { "epoch": 2.07, "learning_rate": 4.623260814837344e-06, "loss": 0.4056, "step": 11193 }, { "epoch": 2.07, "learning_rate": 4.6215767646494235e-06, "loss": 0.4134, "step": 11194 }, { "epoch": 2.07, "learning_rate": 4.619892929050637e-06, "loss": 0.4229, "step": 11195 }, { "epoch": 2.07, "learning_rate": 4.6182093081081555e-06, "loss": 0.4091, "step": 11196 }, { "epoch": 2.07, "learning_rate": 4.616525901889164e-06, "loss": 0.4247, "step": 11197 }, { "epoch": 2.07, "learning_rate": 4.614842710460818e-06, "loss": 0.4182, "step": 11198 }, { "epoch": 2.07, "learning_rate": 4.61315973389028e-06, "loss": 0.4382, "step": 11199 }, { "epoch": 2.07, "learning_rate": 4.611476972244693e-06, "loss": 0.4148, "step": 11200 }, { "epoch": 2.07, "learning_rate": 4.609794425591201e-06, "loss": 0.4234, "step": 11201 }, { "epoch": 2.07, "learning_rate": 4.608112093996928e-06, "loss": 0.4239, "step": 11202 }, { "epoch": 2.07, "learning_rate": 4.606429977529004e-06, "loss": 0.4151, "step": 11203 }, { "epoch": 2.07, "learning_rate": 4.604748076254533e-06, "loss": 0.4252, "step": 11204 }, { "epoch": 2.07, "learning_rate": 4.603066390240629e-06, "loss": 0.4142, "step": 11205 }, { "epoch": 2.07, "learning_rate": 4.60138491955438e-06, "loss": 0.4251, "step": 11206 }, { "epoch": 2.07, "learning_rate": 4.5997036642628825e-06, "loss": 0.4181, "step": 11207 }, { "epoch": 2.07, "learning_rate": 4.59802262443321e-06, "loss": 0.4076, "step": 11208 }, { "epoch": 2.07, "learning_rate": 4.596341800132428e-06, "loss": 0.4097, "step": 11209 }, { "epoch": 2.07, "learning_rate": 4.594661191427608e-06, "loss": 0.4311, "step": 11210 }, { "epoch": 2.07, "learning_rate": 4.5929807983857955e-06, "loss": 0.4185, "step": 11211 }, { "epoch": 2.07, "learning_rate": 4.591300621074042e-06, "loss": 0.4168, "step": 11212 }, { "epoch": 2.07, "learning_rate": 4.5896206595593794e-06, "loss": 0.397, "step": 11213 }, { "epoch": 2.07, "learning_rate": 4.587940913908832e-06, "loss": 0.4073, "step": 11214 }, { "epoch": 2.07, "learning_rate": 4.5862613841894255e-06, "loss": 0.4167, "step": 11215 }, { "epoch": 2.08, "learning_rate": 4.584582070468163e-06, "loss": 0.4003, "step": 11216 }, { "epoch": 2.08, "learning_rate": 4.582902972812053e-06, "loss": 0.4283, "step": 11217 }, { "epoch": 2.08, "learning_rate": 4.581224091288085e-06, "loss": 0.4286, "step": 11218 }, { "epoch": 2.08, "learning_rate": 4.579545425963239e-06, "loss": 0.42, "step": 11219 }, { "epoch": 2.08, "learning_rate": 4.577866976904499e-06, "loss": 0.4155, "step": 11220 }, { "epoch": 2.08, "learning_rate": 4.576188744178824e-06, "loss": 0.4246, "step": 11221 }, { "epoch": 2.08, "learning_rate": 4.5745107278531795e-06, "loss": 0.4178, "step": 11222 }, { "epoch": 2.08, "learning_rate": 4.572832927994509e-06, "loss": 0.4413, "step": 11223 }, { "epoch": 2.08, "learning_rate": 4.57115534466976e-06, "loss": 0.4183, "step": 11224 }, { "epoch": 2.08, "learning_rate": 4.569477977945862e-06, "loss": 0.43, "step": 11225 }, { "epoch": 2.08, "learning_rate": 4.567800827889734e-06, "loss": 0.4267, "step": 11226 }, { "epoch": 2.08, "learning_rate": 4.5661238945683e-06, "loss": 0.4123, "step": 11227 }, { "epoch": 2.08, "learning_rate": 4.564447178048457e-06, "loss": 0.4227, "step": 11228 }, { "epoch": 2.08, "learning_rate": 4.562770678397111e-06, "loss": 0.4194, "step": 11229 }, { "epoch": 2.08, "learning_rate": 4.56109439568115e-06, "loss": 0.4222, "step": 11230 }, { "epoch": 2.08, "learning_rate": 4.559418329967449e-06, "loss": 0.4194, "step": 11231 }, { "epoch": 2.08, "learning_rate": 4.557742481322886e-06, "loss": 0.4245, "step": 11232 }, { "epoch": 2.08, "learning_rate": 4.55606684981432e-06, "loss": 0.4006, "step": 11233 }, { "epoch": 2.08, "learning_rate": 4.554391435508611e-06, "loss": 0.4043, "step": 11234 }, { "epoch": 2.08, "learning_rate": 4.5527162384726e-06, "loss": 0.3997, "step": 11235 }, { "epoch": 2.08, "learning_rate": 4.551041258773122e-06, "loss": 0.4036, "step": 11236 }, { "epoch": 2.08, "learning_rate": 4.549366496477015e-06, "loss": 0.4166, "step": 11237 }, { "epoch": 2.08, "learning_rate": 4.547691951651088e-06, "loss": 0.4127, "step": 11238 }, { "epoch": 2.08, "learning_rate": 4.546017624362161e-06, "loss": 0.4257, "step": 11239 }, { "epoch": 2.08, "learning_rate": 4.544343514677033e-06, "loss": 0.4251, "step": 11240 }, { "epoch": 2.08, "learning_rate": 4.542669622662496e-06, "loss": 0.4179, "step": 11241 }, { "epoch": 2.08, "learning_rate": 4.5409959483853385e-06, "loss": 0.4151, "step": 11242 }, { "epoch": 2.08, "learning_rate": 4.539322491912333e-06, "loss": 0.4159, "step": 11243 }, { "epoch": 2.08, "learning_rate": 4.537649253310253e-06, "loss": 0.4149, "step": 11244 }, { "epoch": 2.08, "learning_rate": 4.535976232645851e-06, "loss": 0.4195, "step": 11245 }, { "epoch": 2.08, "learning_rate": 4.534303429985885e-06, "loss": 0.4135, "step": 11246 }, { "epoch": 2.08, "learning_rate": 4.5326308453970895e-06, "loss": 0.4066, "step": 11247 }, { "epoch": 2.08, "learning_rate": 4.530958478946203e-06, "loss": 0.441, "step": 11248 }, { "epoch": 2.08, "learning_rate": 4.529286330699945e-06, "loss": 0.4089, "step": 11249 }, { "epoch": 2.08, "learning_rate": 4.527614400725037e-06, "loss": 0.4371, "step": 11250 }, { "epoch": 2.08, "learning_rate": 4.525942689088179e-06, "loss": 0.4307, "step": 11251 }, { "epoch": 2.08, "learning_rate": 4.524271195856076e-06, "loss": 0.4445, "step": 11252 }, { "epoch": 2.08, "learning_rate": 4.5225999210954095e-06, "loss": 0.43, "step": 11253 }, { "epoch": 2.08, "learning_rate": 4.520928864872871e-06, "loss": 0.4355, "step": 11254 }, { "epoch": 2.08, "learning_rate": 4.519258027255121e-06, "loss": 0.4018, "step": 11255 }, { "epoch": 2.08, "learning_rate": 4.517587408308833e-06, "loss": 0.4436, "step": 11256 }, { "epoch": 2.08, "learning_rate": 4.515917008100657e-06, "loss": 0.4208, "step": 11257 }, { "epoch": 2.08, "learning_rate": 4.514246826697235e-06, "loss": 0.4203, "step": 11258 }, { "epoch": 2.08, "learning_rate": 4.512576864165213e-06, "loss": 0.4331, "step": 11259 }, { "epoch": 2.08, "learning_rate": 4.510907120571208e-06, "loss": 0.4265, "step": 11260 }, { "epoch": 2.08, "learning_rate": 4.509237595981853e-06, "loss": 0.4267, "step": 11261 }, { "epoch": 2.08, "learning_rate": 4.5075682904637495e-06, "loss": 0.41, "step": 11262 }, { "epoch": 2.08, "learning_rate": 4.505899204083499e-06, "loss": 0.4238, "step": 11263 }, { "epoch": 2.08, "learning_rate": 4.5042303369077025e-06, "loss": 0.3952, "step": 11264 }, { "epoch": 2.08, "learning_rate": 4.502561689002937e-06, "loss": 0.4323, "step": 11265 }, { "epoch": 2.08, "learning_rate": 4.500893260435785e-06, "loss": 0.4129, "step": 11266 }, { "epoch": 2.08, "learning_rate": 4.499225051272806e-06, "loss": 0.4163, "step": 11267 }, { "epoch": 2.08, "learning_rate": 4.497557061580569e-06, "loss": 0.4217, "step": 11268 }, { "epoch": 2.08, "learning_rate": 4.495889291425616e-06, "loss": 0.4256, "step": 11269 }, { "epoch": 2.09, "learning_rate": 4.494221740874486e-06, "loss": 0.4237, "step": 11270 }, { "epoch": 2.09, "learning_rate": 4.492554409993719e-06, "loss": 0.4178, "step": 11271 }, { "epoch": 2.09, "learning_rate": 4.490887298849831e-06, "loss": 0.414, "step": 11272 }, { "epoch": 2.09, "learning_rate": 4.489220407509342e-06, "loss": 0.441, "step": 11273 }, { "epoch": 2.09, "learning_rate": 4.487553736038758e-06, "loss": 0.42, "step": 11274 }, { "epoch": 2.09, "learning_rate": 4.485887284504569e-06, "loss": 0.4214, "step": 11275 }, { "epoch": 2.09, "learning_rate": 4.484221052973272e-06, "loss": 0.4402, "step": 11276 }, { "epoch": 2.09, "learning_rate": 4.482555041511339e-06, "loss": 0.4405, "step": 11277 }, { "epoch": 2.09, "learning_rate": 4.48088925018525e-06, "loss": 0.4179, "step": 11278 }, { "epoch": 2.09, "learning_rate": 4.479223679061459e-06, "loss": 0.3959, "step": 11279 }, { "epoch": 2.09, "learning_rate": 4.477558328206419e-06, "loss": 0.4504, "step": 11280 }, { "epoch": 2.09, "learning_rate": 4.475893197686582e-06, "loss": 0.4093, "step": 11281 }, { "epoch": 2.09, "learning_rate": 4.474228287568373e-06, "loss": 0.4165, "step": 11282 }, { "epoch": 2.09, "learning_rate": 4.4725635979182305e-06, "loss": 0.4129, "step": 11283 }, { "epoch": 2.09, "learning_rate": 4.470899128802565e-06, "loss": 0.4215, "step": 11284 }, { "epoch": 2.09, "learning_rate": 4.4692348802877835e-06, "loss": 0.4327, "step": 11285 }, { "epoch": 2.09, "learning_rate": 4.467570852440296e-06, "loss": 0.4351, "step": 11286 }, { "epoch": 2.09, "learning_rate": 4.465907045326483e-06, "loss": 0.4097, "step": 11287 }, { "epoch": 2.09, "learning_rate": 4.4642434590127374e-06, "loss": 0.3951, "step": 11288 }, { "epoch": 2.09, "learning_rate": 4.462580093565425e-06, "loss": 0.4176, "step": 11289 }, { "epoch": 2.09, "learning_rate": 4.460916949050917e-06, "loss": 0.4425, "step": 11290 }, { "epoch": 2.09, "learning_rate": 4.459254025535569e-06, "loss": 0.4096, "step": 11291 }, { "epoch": 2.09, "learning_rate": 4.4575913230857226e-06, "loss": 0.4159, "step": 11292 }, { "epoch": 2.09, "learning_rate": 4.455928841767725e-06, "loss": 0.4167, "step": 11293 }, { "epoch": 2.09, "learning_rate": 4.454266581647897e-06, "loss": 0.4107, "step": 11294 }, { "epoch": 2.09, "learning_rate": 4.4526045427925705e-06, "loss": 0.433, "step": 11295 }, { "epoch": 2.09, "learning_rate": 4.45094272526805e-06, "loss": 0.4149, "step": 11296 }, { "epoch": 2.09, "learning_rate": 4.449281129140638e-06, "loss": 0.4145, "step": 11297 }, { "epoch": 2.09, "learning_rate": 4.447619754476636e-06, "loss": 0.4299, "step": 11298 }, { "epoch": 2.09, "learning_rate": 4.445958601342322e-06, "loss": 0.4279, "step": 11299 }, { "epoch": 2.09, "learning_rate": 4.444297669803981e-06, "loss": 0.4151, "step": 11300 }, { "epoch": 2.09, "learning_rate": 4.442636959927872e-06, "loss": 0.4114, "step": 11301 }, { "epoch": 2.09, "learning_rate": 4.440976471780261e-06, "loss": 0.4215, "step": 11302 }, { "epoch": 2.09, "learning_rate": 4.439316205427399e-06, "loss": 0.4215, "step": 11303 }, { "epoch": 2.09, "learning_rate": 4.437656160935521e-06, "loss": 0.4298, "step": 11304 }, { "epoch": 2.09, "learning_rate": 4.435996338370867e-06, "loss": 0.411, "step": 11305 }, { "epoch": 2.09, "learning_rate": 4.434336737799659e-06, "loss": 0.4211, "step": 11306 }, { "epoch": 2.09, "learning_rate": 4.432677359288107e-06, "loss": 0.4027, "step": 11307 }, { "epoch": 2.09, "learning_rate": 4.431018202902423e-06, "loss": 0.4232, "step": 11308 }, { "epoch": 2.09, "learning_rate": 4.429359268708799e-06, "loss": 0.4389, "step": 11309 }, { "epoch": 2.09, "learning_rate": 4.427700556773431e-06, "loss": 0.3906, "step": 11310 }, { "epoch": 2.09, "learning_rate": 4.426042067162493e-06, "loss": 0.4083, "step": 11311 }, { "epoch": 2.09, "learning_rate": 4.424383799942153e-06, "loss": 0.4177, "step": 11312 }, { "epoch": 2.09, "learning_rate": 4.4227257551785795e-06, "loss": 0.4206, "step": 11313 }, { "epoch": 2.09, "learning_rate": 4.4210679329379205e-06, "loss": 0.4089, "step": 11314 }, { "epoch": 2.09, "learning_rate": 4.419410333286324e-06, "loss": 0.4297, "step": 11315 }, { "epoch": 2.09, "learning_rate": 4.417752956289919e-06, "loss": 0.4099, "step": 11316 }, { "epoch": 2.09, "learning_rate": 4.416095802014841e-06, "loss": 0.4307, "step": 11317 }, { "epoch": 2.09, "learning_rate": 4.414438870527201e-06, "loss": 0.416, "step": 11318 }, { "epoch": 2.09, "learning_rate": 4.412782161893105e-06, "loss": 0.4314, "step": 11319 }, { "epoch": 2.09, "learning_rate": 4.41112567617866e-06, "loss": 0.4044, "step": 11320 }, { "epoch": 2.09, "learning_rate": 4.4094694134499505e-06, "loss": 0.4407, "step": 11321 }, { "epoch": 2.09, "learning_rate": 4.407813373773063e-06, "loss": 0.443, "step": 11322 }, { "epoch": 2.09, "learning_rate": 4.406157557214069e-06, "loss": 0.397, "step": 11323 }, { "epoch": 2.1, "learning_rate": 4.404501963839029e-06, "loss": 0.4227, "step": 11324 }, { "epoch": 2.1, "learning_rate": 4.402846593714003e-06, "loss": 0.4122, "step": 11325 }, { "epoch": 2.1, "learning_rate": 4.401191446905032e-06, "loss": 0.4354, "step": 11326 }, { "epoch": 2.1, "learning_rate": 4.39953652347816e-06, "loss": 0.3936, "step": 11327 }, { "epoch": 2.1, "learning_rate": 4.397881823499411e-06, "loss": 0.431, "step": 11328 }, { "epoch": 2.1, "learning_rate": 4.396227347034802e-06, "loss": 0.4137, "step": 11329 }, { "epoch": 2.1, "learning_rate": 4.39457309415035e-06, "loss": 0.4046, "step": 11330 }, { "epoch": 2.1, "learning_rate": 4.392919064912052e-06, "loss": 0.4232, "step": 11331 }, { "epoch": 2.1, "learning_rate": 4.391265259385903e-06, "loss": 0.421, "step": 11332 }, { "epoch": 2.1, "learning_rate": 4.389611677637887e-06, "loss": 0.4166, "step": 11333 }, { "epoch": 2.1, "learning_rate": 4.387958319733974e-06, "loss": 0.4109, "step": 11334 }, { "epoch": 2.1, "learning_rate": 4.386305185740136e-06, "loss": 0.4111, "step": 11335 }, { "epoch": 2.1, "learning_rate": 4.3846522757223255e-06, "loss": 0.3929, "step": 11336 }, { "epoch": 2.1, "learning_rate": 4.382999589746496e-06, "loss": 0.4118, "step": 11337 }, { "epoch": 2.1, "learning_rate": 4.38134712787858e-06, "loss": 0.4287, "step": 11338 }, { "epoch": 2.1, "learning_rate": 4.379694890184514e-06, "loss": 0.4126, "step": 11339 }, { "epoch": 2.1, "learning_rate": 4.3780428767302165e-06, "loss": 0.3982, "step": 11340 }, { "epoch": 2.1, "learning_rate": 4.376391087581595e-06, "loss": 0.4229, "step": 11341 }, { "epoch": 2.1, "learning_rate": 4.374739522804562e-06, "loss": 0.4149, "step": 11342 }, { "epoch": 2.1, "learning_rate": 4.373088182465003e-06, "loss": 0.4241, "step": 11343 }, { "epoch": 2.1, "learning_rate": 4.371437066628811e-06, "loss": 0.417, "step": 11344 }, { "epoch": 2.1, "learning_rate": 4.36978617536186e-06, "loss": 0.4312, "step": 11345 }, { "epoch": 2.1, "learning_rate": 4.368135508730011e-06, "loss": 0.437, "step": 11346 }, { "epoch": 2.1, "learning_rate": 4.3664850667991335e-06, "loss": 0.4509, "step": 11347 }, { "epoch": 2.1, "learning_rate": 4.364834849635067e-06, "loss": 0.4201, "step": 11348 }, { "epoch": 2.1, "learning_rate": 4.363184857303661e-06, "loss": 0.4012, "step": 11349 }, { "epoch": 2.1, "learning_rate": 4.361535089870739e-06, "loss": 0.3997, "step": 11350 }, { "epoch": 2.1, "learning_rate": 4.359885547402132e-06, "loss": 0.4094, "step": 11351 }, { "epoch": 2.1, "learning_rate": 4.358236229963644e-06, "loss": 0.4107, "step": 11352 }, { "epoch": 2.1, "learning_rate": 4.35658713762109e-06, "loss": 0.4339, "step": 11353 }, { "epoch": 2.1, "learning_rate": 4.354938270440257e-06, "loss": 0.4141, "step": 11354 }, { "epoch": 2.1, "learning_rate": 4.3532896284869384e-06, "loss": 0.4053, "step": 11355 }, { "epoch": 2.1, "learning_rate": 4.351641211826905e-06, "loss": 0.4078, "step": 11356 }, { "epoch": 2.1, "learning_rate": 4.349993020525934e-06, "loss": 0.4333, "step": 11357 }, { "epoch": 2.1, "learning_rate": 4.348345054649777e-06, "loss": 0.4245, "step": 11358 }, { "epoch": 2.1, "learning_rate": 4.3466973142641926e-06, "loss": 0.4363, "step": 11359 }, { "epoch": 2.1, "learning_rate": 4.345049799434915e-06, "loss": 0.42, "step": 11360 }, { "epoch": 2.1, "learning_rate": 4.343402510227683e-06, "loss": 0.4177, "step": 11361 }, { "epoch": 2.1, "learning_rate": 4.341755446708219e-06, "loss": 0.4215, "step": 11362 }, { "epoch": 2.1, "learning_rate": 4.340108608942233e-06, "loss": 0.4017, "step": 11363 }, { "epoch": 2.1, "learning_rate": 4.338461996995438e-06, "loss": 0.4259, "step": 11364 }, { "epoch": 2.1, "learning_rate": 4.336815610933524e-06, "loss": 0.4019, "step": 11365 }, { "epoch": 2.1, "learning_rate": 4.335169450822184e-06, "loss": 0.4055, "step": 11366 }, { "epoch": 2.1, "learning_rate": 4.333523516727096e-06, "loss": 0.4028, "step": 11367 }, { "epoch": 2.1, "learning_rate": 4.331877808713924e-06, "loss": 0.423, "step": 11368 }, { "epoch": 2.1, "learning_rate": 4.3302323268483384e-06, "loss": 0.4168, "step": 11369 }, { "epoch": 2.1, "learning_rate": 4.328587071195981e-06, "loss": 0.4277, "step": 11370 }, { "epoch": 2.1, "learning_rate": 4.326942041822502e-06, "loss": 0.4176, "step": 11371 }, { "epoch": 2.1, "learning_rate": 4.325297238793535e-06, "loss": 0.4353, "step": 11372 }, { "epoch": 2.1, "learning_rate": 4.323652662174696e-06, "loss": 0.4151, "step": 11373 }, { "epoch": 2.1, "learning_rate": 4.3220083120316095e-06, "loss": 0.4302, "step": 11374 }, { "epoch": 2.1, "learning_rate": 4.320364188429876e-06, "loss": 0.4078, "step": 11375 }, { "epoch": 2.1, "learning_rate": 4.318720291435099e-06, "loss": 0.4022, "step": 11376 }, { "epoch": 2.1, "learning_rate": 4.317076621112864e-06, "loss": 0.4201, "step": 11377 }, { "epoch": 2.11, "learning_rate": 4.315433177528747e-06, "loss": 0.417, "step": 11378 }, { "epoch": 2.11, "learning_rate": 4.313789960748325e-06, "loss": 0.4146, "step": 11379 }, { "epoch": 2.11, "learning_rate": 4.312146970837151e-06, "loss": 0.4273, "step": 11380 }, { "epoch": 2.11, "learning_rate": 4.310504207860787e-06, "loss": 0.436, "step": 11381 }, { "epoch": 2.11, "learning_rate": 4.308861671884767e-06, "loss": 0.4208, "step": 11382 }, { "epoch": 2.11, "learning_rate": 4.307219362974634e-06, "loss": 0.4397, "step": 11383 }, { "epoch": 2.11, "learning_rate": 4.305577281195908e-06, "loss": 0.4176, "step": 11384 }, { "epoch": 2.11, "learning_rate": 4.3039354266141005e-06, "loss": 0.4216, "step": 11385 }, { "epoch": 2.11, "learning_rate": 4.302293799294729e-06, "loss": 0.4201, "step": 11386 }, { "epoch": 2.11, "learning_rate": 4.300652399303283e-06, "loss": 0.401, "step": 11387 }, { "epoch": 2.11, "learning_rate": 4.299011226705255e-06, "loss": 0.4087, "step": 11388 }, { "epoch": 2.11, "learning_rate": 4.297370281566125e-06, "loss": 0.4318, "step": 11389 }, { "epoch": 2.11, "learning_rate": 4.295729563951361e-06, "loss": 0.4089, "step": 11390 }, { "epoch": 2.11, "learning_rate": 4.294089073926428e-06, "loss": 0.4214, "step": 11391 }, { "epoch": 2.11, "learning_rate": 4.292448811556773e-06, "loss": 0.4275, "step": 11392 }, { "epoch": 2.11, "learning_rate": 4.2908087769078475e-06, "loss": 0.4078, "step": 11393 }, { "epoch": 2.11, "learning_rate": 4.289168970045081e-06, "loss": 0.412, "step": 11394 }, { "epoch": 2.11, "learning_rate": 4.287529391033895e-06, "loss": 0.4371, "step": 11395 }, { "epoch": 2.11, "learning_rate": 4.285890039939715e-06, "loss": 0.4254, "step": 11396 }, { "epoch": 2.11, "learning_rate": 4.284250916827939e-06, "loss": 0.404, "step": 11397 }, { "epoch": 2.11, "learning_rate": 4.282612021763972e-06, "loss": 0.4294, "step": 11398 }, { "epoch": 2.11, "learning_rate": 4.280973354813197e-06, "loss": 0.4019, "step": 11399 }, { "epoch": 2.11, "learning_rate": 4.2793349160410005e-06, "loss": 0.4308, "step": 11400 }, { "epoch": 2.11, "learning_rate": 4.2776967055127446e-06, "loss": 0.4153, "step": 11401 }, { "epoch": 2.11, "learning_rate": 4.2760587232938e-06, "loss": 0.4213, "step": 11402 }, { "epoch": 2.11, "learning_rate": 4.274420969449511e-06, "loss": 0.427, "step": 11403 }, { "epoch": 2.11, "learning_rate": 4.272783444045229e-06, "loss": 0.3953, "step": 11404 }, { "epoch": 2.11, "learning_rate": 4.271146147146279e-06, "loss": 0.4046, "step": 11405 }, { "epoch": 2.11, "learning_rate": 4.269509078817995e-06, "loss": 0.424, "step": 11406 }, { "epoch": 2.11, "learning_rate": 4.267872239125685e-06, "loss": 0.4098, "step": 11407 }, { "epoch": 2.11, "learning_rate": 4.266235628134664e-06, "loss": 0.4251, "step": 11408 }, { "epoch": 2.11, "learning_rate": 4.264599245910223e-06, "loss": 0.4074, "step": 11409 }, { "epoch": 2.11, "learning_rate": 4.262963092517656e-06, "loss": 0.4214, "step": 11410 }, { "epoch": 2.11, "learning_rate": 4.261327168022239e-06, "loss": 0.4296, "step": 11411 }, { "epoch": 2.11, "learning_rate": 4.259691472489242e-06, "loss": 0.4199, "step": 11412 }, { "epoch": 2.11, "learning_rate": 4.258056005983928e-06, "loss": 0.4082, "step": 11413 }, { "epoch": 2.11, "learning_rate": 4.256420768571546e-06, "loss": 0.4022, "step": 11414 }, { "epoch": 2.11, "learning_rate": 4.254785760317345e-06, "loss": 0.4202, "step": 11415 }, { "epoch": 2.11, "learning_rate": 4.253150981286556e-06, "loss": 0.4258, "step": 11416 }, { "epoch": 2.11, "learning_rate": 4.251516431544398e-06, "loss": 0.424, "step": 11417 }, { "epoch": 2.11, "learning_rate": 4.249882111156095e-06, "loss": 0.4316, "step": 11418 }, { "epoch": 2.11, "learning_rate": 4.248248020186847e-06, "loss": 0.4158, "step": 11419 }, { "epoch": 2.11, "learning_rate": 4.2466141587018575e-06, "loss": 0.4221, "step": 11420 }, { "epoch": 2.11, "learning_rate": 4.244980526766311e-06, "loss": 0.422, "step": 11421 }, { "epoch": 2.11, "learning_rate": 4.243347124445382e-06, "loss": 0.401, "step": 11422 }, { "epoch": 2.11, "learning_rate": 4.241713951804248e-06, "loss": 0.4333, "step": 11423 }, { "epoch": 2.11, "learning_rate": 4.2400810089080625e-06, "loss": 0.4215, "step": 11424 }, { "epoch": 2.11, "learning_rate": 4.238448295821986e-06, "loss": 0.4263, "step": 11425 }, { "epoch": 2.11, "learning_rate": 4.2368158126111495e-06, "loss": 0.4351, "step": 11426 }, { "epoch": 2.11, "learning_rate": 4.235183559340697e-06, "loss": 0.4315, "step": 11427 }, { "epoch": 2.11, "learning_rate": 4.233551536075745e-06, "loss": 0.4195, "step": 11428 }, { "epoch": 2.11, "learning_rate": 4.231919742881409e-06, "loss": 0.4199, "step": 11429 }, { "epoch": 2.11, "learning_rate": 4.230288179822798e-06, "loss": 0.4223, "step": 11430 }, { "epoch": 2.11, "learning_rate": 4.228656846965004e-06, "loss": 0.4192, "step": 11431 }, { "epoch": 2.12, "learning_rate": 4.22702574437312e-06, "loss": 0.4113, "step": 11432 }, { "epoch": 2.12, "learning_rate": 4.2253948721122194e-06, "loss": 0.428, "step": 11433 }, { "epoch": 2.12, "learning_rate": 4.223764230247369e-06, "loss": 0.4041, "step": 11434 }, { "epoch": 2.12, "learning_rate": 4.222133818843634e-06, "loss": 0.4043, "step": 11435 }, { "epoch": 2.12, "learning_rate": 4.220503637966061e-06, "loss": 0.4248, "step": 11436 }, { "epoch": 2.12, "learning_rate": 4.218873687679694e-06, "loss": 0.4108, "step": 11437 }, { "epoch": 2.12, "learning_rate": 4.217243968049564e-06, "loss": 0.4177, "step": 11438 }, { "epoch": 2.12, "learning_rate": 4.215614479140689e-06, "loss": 0.4264, "step": 11439 }, { "epoch": 2.12, "learning_rate": 4.213985221018091e-06, "loss": 0.433, "step": 11440 }, { "epoch": 2.12, "learning_rate": 4.2123561937467674e-06, "loss": 0.4201, "step": 11441 }, { "epoch": 2.12, "learning_rate": 4.210727397391718e-06, "loss": 0.4038, "step": 11442 }, { "epoch": 2.12, "learning_rate": 4.209098832017928e-06, "loss": 0.4326, "step": 11443 }, { "epoch": 2.12, "learning_rate": 4.207470497690369e-06, "loss": 0.4054, "step": 11444 }, { "epoch": 2.12, "learning_rate": 4.2058423944740164e-06, "loss": 0.4134, "step": 11445 }, { "epoch": 2.12, "learning_rate": 4.20421452243382e-06, "loss": 0.4218, "step": 11446 }, { "epoch": 2.12, "learning_rate": 4.202586881634739e-06, "loss": 0.4061, "step": 11447 }, { "epoch": 2.12, "learning_rate": 4.200959472141703e-06, "loss": 0.4354, "step": 11448 }, { "epoch": 2.12, "learning_rate": 4.199332294019651e-06, "loss": 0.4128, "step": 11449 }, { "epoch": 2.12, "learning_rate": 4.1977053473334986e-06, "loss": 0.4258, "step": 11450 }, { "epoch": 2.12, "learning_rate": 4.196078632148162e-06, "loss": 0.4018, "step": 11451 }, { "epoch": 2.12, "learning_rate": 4.194452148528539e-06, "loss": 0.4197, "step": 11452 }, { "epoch": 2.12, "learning_rate": 4.192825896539531e-06, "loss": 0.437, "step": 11453 }, { "epoch": 2.12, "learning_rate": 4.191199876246014e-06, "loss": 0.3993, "step": 11454 }, { "epoch": 2.12, "learning_rate": 4.189574087712871e-06, "loss": 0.4142, "step": 11455 }, { "epoch": 2.12, "learning_rate": 4.18794853100496e-06, "loss": 0.4234, "step": 11456 }, { "epoch": 2.12, "learning_rate": 4.186323206187146e-06, "loss": 0.4136, "step": 11457 }, { "epoch": 2.12, "learning_rate": 4.184698113324269e-06, "loss": 0.4149, "step": 11458 }, { "epoch": 2.12, "learning_rate": 4.183073252481174e-06, "loss": 0.4124, "step": 11459 }, { "epoch": 2.12, "learning_rate": 4.181448623722686e-06, "loss": 0.4282, "step": 11460 }, { "epoch": 2.12, "learning_rate": 4.179824227113621e-06, "loss": 0.3964, "step": 11461 }, { "epoch": 2.12, "learning_rate": 4.1782000627187994e-06, "loss": 0.4463, "step": 11462 }, { "epoch": 2.12, "learning_rate": 4.176576130603011e-06, "loss": 0.4271, "step": 11463 }, { "epoch": 2.12, "learning_rate": 4.174952430831057e-06, "loss": 0.4396, "step": 11464 }, { "epoch": 2.12, "learning_rate": 4.173328963467717e-06, "loss": 0.4349, "step": 11465 }, { "epoch": 2.12, "learning_rate": 4.171705728577759e-06, "loss": 0.4163, "step": 11466 }, { "epoch": 2.12, "learning_rate": 4.170082726225956e-06, "loss": 0.4044, "step": 11467 }, { "epoch": 2.12, "learning_rate": 4.168459956477055e-06, "loss": 0.4336, "step": 11468 }, { "epoch": 2.12, "learning_rate": 4.1668374193958074e-06, "loss": 0.4073, "step": 11469 }, { "epoch": 2.12, "learning_rate": 4.1652151150469445e-06, "loss": 0.431, "step": 11470 }, { "epoch": 2.12, "learning_rate": 4.163593043495199e-06, "loss": 0.4187, "step": 11471 }, { "epoch": 2.12, "learning_rate": 4.1619712048052855e-06, "loss": 0.4195, "step": 11472 }, { "epoch": 2.12, "learning_rate": 4.160349599041908e-06, "loss": 0.4247, "step": 11473 }, { "epoch": 2.12, "learning_rate": 4.1587282262697726e-06, "loss": 0.4118, "step": 11474 }, { "epoch": 2.12, "learning_rate": 4.157107086553563e-06, "loss": 0.4283, "step": 11475 }, { "epoch": 2.12, "learning_rate": 4.155486179957967e-06, "loss": 0.3997, "step": 11476 }, { "epoch": 2.12, "learning_rate": 4.153865506547652e-06, "loss": 0.4332, "step": 11477 }, { "epoch": 2.12, "learning_rate": 4.152245066387275e-06, "loss": 0.4234, "step": 11478 }, { "epoch": 2.12, "learning_rate": 4.1506248595414965e-06, "loss": 0.4244, "step": 11479 }, { "epoch": 2.12, "learning_rate": 4.149004886074953e-06, "loss": 0.4339, "step": 11480 }, { "epoch": 2.12, "learning_rate": 4.147385146052285e-06, "loss": 0.408, "step": 11481 }, { "epoch": 2.12, "learning_rate": 4.145765639538114e-06, "loss": 0.4313, "step": 11482 }, { "epoch": 2.12, "learning_rate": 4.144146366597051e-06, "loss": 0.4237, "step": 11483 }, { "epoch": 2.12, "learning_rate": 4.1425273272937115e-06, "loss": 0.4053, "step": 11484 }, { "epoch": 2.12, "learning_rate": 4.140908521692683e-06, "loss": 0.4357, "step": 11485 }, { "epoch": 2.13, "learning_rate": 4.139289949858558e-06, "loss": 0.4115, "step": 11486 }, { "epoch": 2.13, "learning_rate": 4.137671611855915e-06, "loss": 0.4011, "step": 11487 }, { "epoch": 2.13, "learning_rate": 4.136053507749317e-06, "loss": 0.4207, "step": 11488 }, { "epoch": 2.13, "learning_rate": 4.13443563760333e-06, "loss": 0.4282, "step": 11489 }, { "epoch": 2.13, "learning_rate": 4.1328180014825e-06, "loss": 0.4169, "step": 11490 }, { "epoch": 2.13, "learning_rate": 4.131200599451369e-06, "loss": 0.4246, "step": 11491 }, { "epoch": 2.13, "learning_rate": 4.129583431574468e-06, "loss": 0.413, "step": 11492 }, { "epoch": 2.13, "learning_rate": 4.127966497916321e-06, "loss": 0.4167, "step": 11493 }, { "epoch": 2.13, "learning_rate": 4.126349798541439e-06, "loss": 0.4157, "step": 11494 }, { "epoch": 2.13, "learning_rate": 4.124733333514323e-06, "loss": 0.4243, "step": 11495 }, { "epoch": 2.13, "learning_rate": 4.123117102899471e-06, "loss": 0.4083, "step": 11496 }, { "epoch": 2.13, "learning_rate": 4.121501106761363e-06, "loss": 0.414, "step": 11497 }, { "epoch": 2.13, "learning_rate": 4.119885345164482e-06, "loss": 0.4101, "step": 11498 }, { "epoch": 2.13, "learning_rate": 4.118269818173284e-06, "loss": 0.4135, "step": 11499 }, { "epoch": 2.13, "learning_rate": 4.116654525852234e-06, "loss": 0.4085, "step": 11500 }, { "epoch": 2.13, "learning_rate": 4.115039468265773e-06, "loss": 0.4364, "step": 11501 }, { "epoch": 2.13, "learning_rate": 4.113424645478345e-06, "loss": 0.4091, "step": 11502 }, { "epoch": 2.13, "learning_rate": 4.111810057554369e-06, "loss": 0.4301, "step": 11503 }, { "epoch": 2.13, "learning_rate": 4.110195704558277e-06, "loss": 0.4167, "step": 11504 }, { "epoch": 2.13, "learning_rate": 4.108581586554467e-06, "loss": 0.415, "step": 11505 }, { "epoch": 2.13, "learning_rate": 4.106967703607346e-06, "loss": 0.4046, "step": 11506 }, { "epoch": 2.13, "learning_rate": 4.105354055781301e-06, "loss": 0.4058, "step": 11507 }, { "epoch": 2.13, "learning_rate": 4.103740643140719e-06, "loss": 0.4297, "step": 11508 }, { "epoch": 2.13, "learning_rate": 4.102127465749967e-06, "loss": 0.4104, "step": 11509 }, { "epoch": 2.13, "learning_rate": 4.100514523673409e-06, "loss": 0.4119, "step": 11510 }, { "epoch": 2.13, "learning_rate": 4.0989018169754004e-06, "loss": 0.423, "step": 11511 }, { "epoch": 2.13, "learning_rate": 4.09728934572028e-06, "loss": 0.4337, "step": 11512 }, { "epoch": 2.13, "learning_rate": 4.09567710997239e-06, "loss": 0.4194, "step": 11513 }, { "epoch": 2.13, "learning_rate": 4.094065109796049e-06, "loss": 0.4249, "step": 11514 }, { "epoch": 2.13, "learning_rate": 4.092453345255579e-06, "loss": 0.3986, "step": 11515 }, { "epoch": 2.13, "learning_rate": 4.0908418164152816e-06, "loss": 0.4057, "step": 11516 }, { "epoch": 2.13, "learning_rate": 4.089230523339454e-06, "loss": 0.4227, "step": 11517 }, { "epoch": 2.13, "learning_rate": 4.0876194660923865e-06, "loss": 0.4185, "step": 11518 }, { "epoch": 2.13, "learning_rate": 4.086008644738353e-06, "loss": 0.4064, "step": 11519 }, { "epoch": 2.13, "learning_rate": 4.084398059341629e-06, "loss": 0.4159, "step": 11520 }, { "epoch": 2.13, "learning_rate": 4.082787709966469e-06, "loss": 0.4118, "step": 11521 }, { "epoch": 2.13, "learning_rate": 4.081177596677122e-06, "loss": 0.4024, "step": 11522 }, { "epoch": 2.13, "learning_rate": 4.079567719537832e-06, "loss": 0.4214, "step": 11523 }, { "epoch": 2.13, "learning_rate": 4.077958078612827e-06, "loss": 0.4081, "step": 11524 }, { "epoch": 2.13, "learning_rate": 4.0763486739663326e-06, "loss": 0.4265, "step": 11525 }, { "epoch": 2.13, "learning_rate": 4.074739505662559e-06, "loss": 0.4273, "step": 11526 }, { "epoch": 2.13, "learning_rate": 4.073130573765706e-06, "loss": 0.4208, "step": 11527 }, { "epoch": 2.13, "learning_rate": 4.071521878339973e-06, "loss": 0.4119, "step": 11528 }, { "epoch": 2.13, "learning_rate": 4.069913419449536e-06, "loss": 0.4241, "step": 11529 }, { "epoch": 2.13, "learning_rate": 4.068305197158579e-06, "loss": 0.4111, "step": 11530 }, { "epoch": 2.13, "learning_rate": 4.066697211531262e-06, "loss": 0.4297, "step": 11531 }, { "epoch": 2.13, "learning_rate": 4.065089462631737e-06, "loss": 0.4168, "step": 11532 }, { "epoch": 2.13, "learning_rate": 4.0634819505241585e-06, "loss": 0.4224, "step": 11533 }, { "epoch": 2.13, "learning_rate": 4.061874675272655e-06, "loss": 0.4083, "step": 11534 }, { "epoch": 2.13, "learning_rate": 4.060267636941363e-06, "loss": 0.4016, "step": 11535 }, { "epoch": 2.13, "learning_rate": 4.05866083559439e-06, "loss": 0.39, "step": 11536 }, { "epoch": 2.13, "learning_rate": 4.057054271295854e-06, "loss": 0.4226, "step": 11537 }, { "epoch": 2.13, "learning_rate": 4.055447944109848e-06, "loss": 0.411, "step": 11538 }, { "epoch": 2.13, "learning_rate": 4.053841854100461e-06, "loss": 0.4299, "step": 11539 }, { "epoch": 2.14, "learning_rate": 4.052236001331778e-06, "loss": 0.4133, "step": 11540 }, { "epoch": 2.14, "learning_rate": 4.050630385867863e-06, "loss": 0.4441, "step": 11541 }, { "epoch": 2.14, "learning_rate": 4.049025007772784e-06, "loss": 0.4108, "step": 11542 }, { "epoch": 2.14, "learning_rate": 4.04741986711059e-06, "loss": 0.3996, "step": 11543 }, { "epoch": 2.14, "learning_rate": 4.045814963945318e-06, "loss": 0.4472, "step": 11544 }, { "epoch": 2.14, "learning_rate": 4.04421029834101e-06, "loss": 0.4023, "step": 11545 }, { "epoch": 2.14, "learning_rate": 4.042605870361679e-06, "loss": 0.4162, "step": 11546 }, { "epoch": 2.14, "learning_rate": 4.041001680071348e-06, "loss": 0.4012, "step": 11547 }, { "epoch": 2.14, "learning_rate": 4.039397727534013e-06, "loss": 0.4355, "step": 11548 }, { "epoch": 2.14, "learning_rate": 4.037794012813677e-06, "loss": 0.4316, "step": 11549 }, { "epoch": 2.14, "learning_rate": 4.036190535974318e-06, "loss": 0.4452, "step": 11550 }, { "epoch": 2.14, "learning_rate": 4.034587297079918e-06, "loss": 0.4254, "step": 11551 }, { "epoch": 2.14, "learning_rate": 4.032984296194438e-06, "loss": 0.4272, "step": 11552 }, { "epoch": 2.14, "learning_rate": 4.031381533381838e-06, "loss": 0.4215, "step": 11553 }, { "epoch": 2.14, "learning_rate": 4.029779008706063e-06, "loss": 0.3967, "step": 11554 }, { "epoch": 2.14, "learning_rate": 4.028176722231054e-06, "loss": 0.4249, "step": 11555 }, { "epoch": 2.14, "learning_rate": 4.0265746740207345e-06, "loss": 0.4148, "step": 11556 }, { "epoch": 2.14, "learning_rate": 4.02497286413903e-06, "loss": 0.4272, "step": 11557 }, { "epoch": 2.14, "learning_rate": 4.023371292649841e-06, "loss": 0.4147, "step": 11558 }, { "epoch": 2.14, "learning_rate": 4.0217699596170755e-06, "loss": 0.4148, "step": 11559 }, { "epoch": 2.14, "learning_rate": 4.020168865104621e-06, "loss": 0.4213, "step": 11560 }, { "epoch": 2.14, "learning_rate": 4.018568009176353e-06, "loss": 0.4077, "step": 11561 }, { "epoch": 2.14, "learning_rate": 4.016967391896153e-06, "loss": 0.4151, "step": 11562 }, { "epoch": 2.14, "learning_rate": 4.0153670133278714e-06, "loss": 0.4355, "step": 11563 }, { "epoch": 2.14, "learning_rate": 4.013766873535369e-06, "loss": 0.4008, "step": 11564 }, { "epoch": 2.14, "learning_rate": 4.0121669725824854e-06, "loss": 0.4252, "step": 11565 }, { "epoch": 2.14, "learning_rate": 4.01056731053305e-06, "loss": 0.4265, "step": 11566 }, { "epoch": 2.14, "learning_rate": 4.008967887450893e-06, "loss": 0.4, "step": 11567 }, { "epoch": 2.14, "learning_rate": 4.007368703399822e-06, "loss": 0.4068, "step": 11568 }, { "epoch": 2.14, "learning_rate": 4.005769758443648e-06, "loss": 0.4097, "step": 11569 }, { "epoch": 2.14, "learning_rate": 4.004171052646163e-06, "loss": 0.4103, "step": 11570 }, { "epoch": 2.14, "learning_rate": 4.002572586071148e-06, "loss": 0.4326, "step": 11571 }, { "epoch": 2.14, "learning_rate": 4.000974358782387e-06, "loss": 0.4088, "step": 11572 }, { "epoch": 2.14, "learning_rate": 3.999376370843639e-06, "loss": 0.4069, "step": 11573 }, { "epoch": 2.14, "learning_rate": 3.997778622318666e-06, "loss": 0.4249, "step": 11574 }, { "epoch": 2.14, "learning_rate": 3.9961811132712135e-06, "loss": 0.4115, "step": 11575 }, { "epoch": 2.14, "learning_rate": 3.994583843765016e-06, "loss": 0.4311, "step": 11576 }, { "epoch": 2.14, "learning_rate": 3.9929868138638085e-06, "loss": 0.4113, "step": 11577 }, { "epoch": 2.14, "learning_rate": 3.991390023631301e-06, "loss": 0.4303, "step": 11578 }, { "epoch": 2.14, "learning_rate": 3.98979347313121e-06, "loss": 0.4109, "step": 11579 }, { "epoch": 2.14, "learning_rate": 3.988197162427229e-06, "loss": 0.4066, "step": 11580 }, { "epoch": 2.14, "learning_rate": 3.986601091583054e-06, "loss": 0.4129, "step": 11581 }, { "epoch": 2.14, "learning_rate": 3.985005260662362e-06, "loss": 0.4225, "step": 11582 }, { "epoch": 2.14, "learning_rate": 3.983409669728819e-06, "loss": 0.4039, "step": 11583 }, { "epoch": 2.14, "learning_rate": 3.981814318846096e-06, "loss": 0.4043, "step": 11584 }, { "epoch": 2.14, "learning_rate": 3.980219208077835e-06, "loss": 0.4343, "step": 11585 }, { "epoch": 2.14, "learning_rate": 3.978624337487687e-06, "loss": 0.4176, "step": 11586 }, { "epoch": 2.14, "learning_rate": 3.977029707139278e-06, "loss": 0.4135, "step": 11587 }, { "epoch": 2.14, "learning_rate": 3.975435317096229e-06, "loss": 0.4343, "step": 11588 }, { "epoch": 2.14, "learning_rate": 3.973841167422161e-06, "loss": 0.4288, "step": 11589 }, { "epoch": 2.14, "learning_rate": 3.9722472581806696e-06, "loss": 0.4118, "step": 11590 }, { "epoch": 2.14, "learning_rate": 3.970653589435356e-06, "loss": 0.4266, "step": 11591 }, { "epoch": 2.14, "learning_rate": 3.969060161249801e-06, "loss": 0.4076, "step": 11592 }, { "epoch": 2.14, "learning_rate": 3.967466973687576e-06, "loss": 0.4218, "step": 11593 }, { "epoch": 2.15, "learning_rate": 3.965874026812253e-06, "loss": 0.3985, "step": 11594 }, { "epoch": 2.15, "learning_rate": 3.964281320687381e-06, "loss": 0.4093, "step": 11595 }, { "epoch": 2.15, "learning_rate": 3.962688855376514e-06, "loss": 0.4191, "step": 11596 }, { "epoch": 2.15, "learning_rate": 3.961096630943183e-06, "loss": 0.4147, "step": 11597 }, { "epoch": 2.15, "learning_rate": 3.9595046474509125e-06, "loss": 0.4179, "step": 11598 }, { "epoch": 2.15, "learning_rate": 3.957912904963226e-06, "loss": 0.4506, "step": 11599 }, { "epoch": 2.15, "learning_rate": 3.9563214035436244e-06, "loss": 0.4203, "step": 11600 }, { "epoch": 2.15, "learning_rate": 3.954730143255614e-06, "loss": 0.4153, "step": 11601 }, { "epoch": 2.15, "learning_rate": 3.953139124162674e-06, "loss": 0.436, "step": 11602 }, { "epoch": 2.15, "learning_rate": 3.95154834632829e-06, "loss": 0.4285, "step": 11603 }, { "epoch": 2.15, "learning_rate": 3.9499578098159265e-06, "loss": 0.4149, "step": 11604 }, { "epoch": 2.15, "learning_rate": 3.948367514689048e-06, "loss": 0.4153, "step": 11605 }, { "epoch": 2.15, "learning_rate": 3.946777461011097e-06, "loss": 0.4198, "step": 11606 }, { "epoch": 2.15, "learning_rate": 3.9451876488455236e-06, "loss": 0.4032, "step": 11607 }, { "epoch": 2.15, "learning_rate": 3.943598078255748e-06, "loss": 0.4268, "step": 11608 }, { "epoch": 2.15, "learning_rate": 3.9420087493051995e-06, "loss": 0.3998, "step": 11609 }, { "epoch": 2.15, "learning_rate": 3.940419662057282e-06, "loss": 0.4128, "step": 11610 }, { "epoch": 2.15, "learning_rate": 3.938830816575405e-06, "loss": 0.418, "step": 11611 }, { "epoch": 2.15, "learning_rate": 3.937242212922953e-06, "loss": 0.4185, "step": 11612 }, { "epoch": 2.15, "learning_rate": 3.935653851163315e-06, "loss": 0.4234, "step": 11613 }, { "epoch": 2.15, "learning_rate": 3.934065731359861e-06, "loss": 0.4087, "step": 11614 }, { "epoch": 2.15, "learning_rate": 3.93247785357595e-06, "loss": 0.4149, "step": 11615 }, { "epoch": 2.15, "learning_rate": 3.930890217874942e-06, "loss": 0.4291, "step": 11616 }, { "epoch": 2.15, "learning_rate": 3.929302824320173e-06, "loss": 0.4248, "step": 11617 }, { "epoch": 2.15, "learning_rate": 3.927715672974988e-06, "loss": 0.4151, "step": 11618 }, { "epoch": 2.15, "learning_rate": 3.926128763902703e-06, "loss": 0.426, "step": 11619 }, { "epoch": 2.15, "learning_rate": 3.9245420971666326e-06, "loss": 0.419, "step": 11620 }, { "epoch": 2.15, "learning_rate": 3.922955672830087e-06, "loss": 0.4264, "step": 11621 }, { "epoch": 2.15, "learning_rate": 3.921369490956355e-06, "loss": 0.4108, "step": 11622 }, { "epoch": 2.15, "learning_rate": 3.919783551608729e-06, "loss": 0.4205, "step": 11623 }, { "epoch": 2.15, "learning_rate": 3.91819785485048e-06, "loss": 0.4101, "step": 11624 }, { "epoch": 2.15, "learning_rate": 3.916612400744879e-06, "loss": 0.4179, "step": 11625 }, { "epoch": 2.15, "learning_rate": 3.9150271893551804e-06, "loss": 0.406, "step": 11626 }, { "epoch": 2.15, "learning_rate": 3.9134422207446274e-06, "loss": 0.4171, "step": 11627 }, { "epoch": 2.15, "learning_rate": 3.911857494976465e-06, "loss": 0.4208, "step": 11628 }, { "epoch": 2.15, "learning_rate": 3.910273012113912e-06, "loss": 0.4104, "step": 11629 }, { "epoch": 2.15, "learning_rate": 3.9086887722201946e-06, "loss": 0.4252, "step": 11630 }, { "epoch": 2.15, "learning_rate": 3.907104775358518e-06, "loss": 0.4257, "step": 11631 }, { "epoch": 2.15, "learning_rate": 3.905521021592076e-06, "loss": 0.4278, "step": 11632 }, { "epoch": 2.15, "learning_rate": 3.903937510984066e-06, "loss": 0.4059, "step": 11633 }, { "epoch": 2.15, "learning_rate": 3.902354243597658e-06, "loss": 0.4037, "step": 11634 }, { "epoch": 2.15, "learning_rate": 3.900771219496031e-06, "loss": 0.4271, "step": 11635 }, { "epoch": 2.15, "learning_rate": 3.899188438742339e-06, "loss": 0.405, "step": 11636 }, { "epoch": 2.15, "learning_rate": 3.89760590139973e-06, "loss": 0.4043, "step": 11637 }, { "epoch": 2.15, "learning_rate": 3.896023607531351e-06, "loss": 0.4177, "step": 11638 }, { "epoch": 2.15, "learning_rate": 3.894441557200324e-06, "loss": 0.4226, "step": 11639 }, { "epoch": 2.15, "learning_rate": 3.892859750469779e-06, "loss": 0.4066, "step": 11640 }, { "epoch": 2.15, "learning_rate": 3.8912781874028235e-06, "loss": 0.3902, "step": 11641 }, { "epoch": 2.15, "learning_rate": 3.8896968680625545e-06, "loss": 0.4161, "step": 11642 }, { "epoch": 2.15, "learning_rate": 3.888115792512072e-06, "loss": 0.4173, "step": 11643 }, { "epoch": 2.15, "learning_rate": 3.886534960814447e-06, "loss": 0.4108, "step": 11644 }, { "epoch": 2.15, "learning_rate": 3.8849543730327646e-06, "loss": 0.4304, "step": 11645 }, { "epoch": 2.15, "learning_rate": 3.88337402923008e-06, "loss": 0.4418, "step": 11646 }, { "epoch": 2.15, "learning_rate": 3.881793929469444e-06, "loss": 0.4007, "step": 11647 }, { "epoch": 2.16, "learning_rate": 3.880214073813906e-06, "loss": 0.4157, "step": 11648 }, { "epoch": 2.16, "learning_rate": 3.878634462326492e-06, "loss": 0.4229, "step": 11649 }, { "epoch": 2.16, "learning_rate": 3.877055095070233e-06, "loss": 0.4132, "step": 11650 }, { "epoch": 2.16, "learning_rate": 3.875475972108137e-06, "loss": 0.4084, "step": 11651 }, { "epoch": 2.16, "learning_rate": 3.873897093503213e-06, "loss": 0.428, "step": 11652 }, { "epoch": 2.16, "learning_rate": 3.872318459318449e-06, "loss": 0.4503, "step": 11653 }, { "epoch": 2.16, "learning_rate": 3.870740069616837e-06, "loss": 0.4266, "step": 11654 }, { "epoch": 2.16, "learning_rate": 3.8691619244613455e-06, "loss": 0.4141, "step": 11655 }, { "epoch": 2.16, "learning_rate": 3.867584023914946e-06, "loss": 0.4285, "step": 11656 }, { "epoch": 2.16, "learning_rate": 3.866006368040586e-06, "loss": 0.4171, "step": 11657 }, { "epoch": 2.16, "learning_rate": 3.864428956901217e-06, "loss": 0.4254, "step": 11658 }, { "epoch": 2.16, "learning_rate": 3.862851790559772e-06, "loss": 0.3916, "step": 11659 }, { "epoch": 2.16, "learning_rate": 3.86127486907918e-06, "loss": 0.4532, "step": 11660 }, { "epoch": 2.16, "learning_rate": 3.859698192522352e-06, "loss": 0.425, "step": 11661 }, { "epoch": 2.16, "learning_rate": 3.858121760952201e-06, "loss": 0.435, "step": 11662 }, { "epoch": 2.16, "learning_rate": 3.856545574431621e-06, "loss": 0.4129, "step": 11663 }, { "epoch": 2.16, "learning_rate": 3.854969633023494e-06, "loss": 0.4186, "step": 11664 }, { "epoch": 2.16, "learning_rate": 3.853393936790705e-06, "loss": 0.4255, "step": 11665 }, { "epoch": 2.16, "learning_rate": 3.8518184857961146e-06, "loss": 0.4292, "step": 11666 }, { "epoch": 2.16, "learning_rate": 3.850243280102587e-06, "loss": 0.4294, "step": 11667 }, { "epoch": 2.16, "learning_rate": 3.848668319772967e-06, "loss": 0.4081, "step": 11668 }, { "epoch": 2.16, "learning_rate": 3.8470936048700876e-06, "loss": 0.4134, "step": 11669 }, { "epoch": 2.16, "learning_rate": 3.845519135456786e-06, "loss": 0.4489, "step": 11670 }, { "epoch": 2.16, "learning_rate": 3.843944911595873e-06, "loss": 0.4387, "step": 11671 }, { "epoch": 2.16, "learning_rate": 3.842370933350163e-06, "loss": 0.4282, "step": 11672 }, { "epoch": 2.16, "learning_rate": 3.840797200782448e-06, "loss": 0.4236, "step": 11673 }, { "epoch": 2.16, "learning_rate": 3.8392237139555255e-06, "loss": 0.4037, "step": 11674 }, { "epoch": 2.16, "learning_rate": 3.83765047293217e-06, "loss": 0.4234, "step": 11675 }, { "epoch": 2.16, "learning_rate": 3.8360774777751494e-06, "loss": 0.4033, "step": 11676 }, { "epoch": 2.16, "learning_rate": 3.834504728547228e-06, "loss": 0.4237, "step": 11677 }, { "epoch": 2.16, "learning_rate": 3.832932225311149e-06, "loss": 0.4051, "step": 11678 }, { "epoch": 2.16, "learning_rate": 3.8313599681296595e-06, "loss": 0.4222, "step": 11679 }, { "epoch": 2.16, "learning_rate": 3.829787957065487e-06, "loss": 0.4339, "step": 11680 }, { "epoch": 2.16, "learning_rate": 3.8282161921813475e-06, "loss": 0.4125, "step": 11681 }, { "epoch": 2.16, "learning_rate": 3.826644673539958e-06, "loss": 0.4105, "step": 11682 }, { "epoch": 2.16, "learning_rate": 3.825073401204013e-06, "loss": 0.3834, "step": 11683 }, { "epoch": 2.16, "learning_rate": 3.823502375236211e-06, "loss": 0.4093, "step": 11684 }, { "epoch": 2.16, "learning_rate": 3.821931595699228e-06, "loss": 0.4004, "step": 11685 }, { "epoch": 2.16, "learning_rate": 3.820361062655733e-06, "loss": 0.4101, "step": 11686 }, { "epoch": 2.16, "learning_rate": 3.818790776168394e-06, "loss": 0.4124, "step": 11687 }, { "epoch": 2.16, "learning_rate": 3.817220736299855e-06, "loss": 0.4173, "step": 11688 }, { "epoch": 2.16, "learning_rate": 3.815650943112764e-06, "loss": 0.4223, "step": 11689 }, { "epoch": 2.16, "learning_rate": 3.8140813966697522e-06, "loss": 0.4201, "step": 11690 }, { "epoch": 2.16, "learning_rate": 3.812512097033435e-06, "loss": 0.4042, "step": 11691 }, { "epoch": 2.16, "learning_rate": 3.810943044266433e-06, "loss": 0.4174, "step": 11692 }, { "epoch": 2.16, "learning_rate": 3.8093742384313416e-06, "loss": 0.411, "step": 11693 }, { "epoch": 2.16, "learning_rate": 3.807805679590759e-06, "loss": 0.4318, "step": 11694 }, { "epoch": 2.16, "learning_rate": 3.806237367807263e-06, "loss": 0.431, "step": 11695 }, { "epoch": 2.16, "learning_rate": 3.8046693031434314e-06, "loss": 0.4195, "step": 11696 }, { "epoch": 2.16, "learning_rate": 3.8031014856618244e-06, "loss": 0.4159, "step": 11697 }, { "epoch": 2.16, "learning_rate": 3.801533915424991e-06, "loss": 0.412, "step": 11698 }, { "epoch": 2.16, "learning_rate": 3.799966592495482e-06, "loss": 0.435, "step": 11699 }, { "epoch": 2.16, "learning_rate": 3.7983995169358235e-06, "loss": 0.4202, "step": 11700 }, { "epoch": 2.16, "learning_rate": 3.796832688808546e-06, "loss": 0.4045, "step": 11701 }, { "epoch": 2.17, "learning_rate": 3.7952661081761555e-06, "loss": 0.4244, "step": 11702 }, { "epoch": 2.17, "learning_rate": 3.793699775101164e-06, "loss": 0.4101, "step": 11703 }, { "epoch": 2.17, "learning_rate": 3.792133689646056e-06, "loss": 0.45, "step": 11704 }, { "epoch": 2.17, "learning_rate": 3.7905678518733246e-06, "loss": 0.4196, "step": 11705 }, { "epoch": 2.17, "learning_rate": 3.789002261845436e-06, "loss": 0.4211, "step": 11706 }, { "epoch": 2.17, "learning_rate": 3.7874369196248606e-06, "loss": 0.4149, "step": 11707 }, { "epoch": 2.17, "learning_rate": 3.7858718252740467e-06, "loss": 0.4095, "step": 11708 }, { "epoch": 2.17, "learning_rate": 3.7843069788554453e-06, "loss": 0.4354, "step": 11709 }, { "epoch": 2.17, "learning_rate": 3.7827423804314835e-06, "loss": 0.4278, "step": 11710 }, { "epoch": 2.17, "learning_rate": 3.781178030064594e-06, "loss": 0.4257, "step": 11711 }, { "epoch": 2.17, "learning_rate": 3.779613927817186e-06, "loss": 0.4151, "step": 11712 }, { "epoch": 2.17, "learning_rate": 3.7780500737516633e-06, "loss": 0.405, "step": 11713 }, { "epoch": 2.17, "learning_rate": 3.7764864679304258e-06, "loss": 0.4158, "step": 11714 }, { "epoch": 2.17, "learning_rate": 3.7749231104158536e-06, "loss": 0.4365, "step": 11715 }, { "epoch": 2.17, "learning_rate": 3.7733600012703253e-06, "loss": 0.4106, "step": 11716 }, { "epoch": 2.17, "learning_rate": 3.7717971405562027e-06, "loss": 0.4122, "step": 11717 }, { "epoch": 2.17, "learning_rate": 3.7702345283358454e-06, "loss": 0.4253, "step": 11718 }, { "epoch": 2.17, "learning_rate": 3.7686721646715974e-06, "loss": 0.4034, "step": 11719 }, { "epoch": 2.17, "learning_rate": 3.7671100496257886e-06, "loss": 0.401, "step": 11720 }, { "epoch": 2.17, "learning_rate": 3.7655481832607533e-06, "loss": 0.4075, "step": 11721 }, { "epoch": 2.17, "learning_rate": 3.7639865656387985e-06, "loss": 0.4116, "step": 11722 }, { "epoch": 2.17, "learning_rate": 3.762425196822238e-06, "loss": 0.4423, "step": 11723 }, { "epoch": 2.17, "learning_rate": 3.760864076873363e-06, "loss": 0.4082, "step": 11724 }, { "epoch": 2.17, "learning_rate": 3.7593032058544566e-06, "loss": 0.4147, "step": 11725 }, { "epoch": 2.17, "learning_rate": 3.7577425838278015e-06, "loss": 0.4166, "step": 11726 }, { "epoch": 2.17, "learning_rate": 3.7561822108556568e-06, "loss": 0.4113, "step": 11727 }, { "epoch": 2.17, "learning_rate": 3.7546220870002856e-06, "loss": 0.4274, "step": 11728 }, { "epoch": 2.17, "learning_rate": 3.753062212323929e-06, "loss": 0.4176, "step": 11729 }, { "epoch": 2.17, "learning_rate": 3.751502586888822e-06, "loss": 0.4136, "step": 11730 }, { "epoch": 2.17, "learning_rate": 3.7499432107571955e-06, "loss": 0.407, "step": 11731 }, { "epoch": 2.17, "learning_rate": 3.74838408399126e-06, "loss": 0.4029, "step": 11732 }, { "epoch": 2.17, "learning_rate": 3.7468252066532297e-06, "loss": 0.4079, "step": 11733 }, { "epoch": 2.17, "learning_rate": 3.7452665788052946e-06, "loss": 0.416, "step": 11734 }, { "epoch": 2.17, "learning_rate": 3.7437082005096393e-06, "loss": 0.3987, "step": 11735 }, { "epoch": 2.17, "learning_rate": 3.7421500718284475e-06, "loss": 0.4201, "step": 11736 }, { "epoch": 2.17, "learning_rate": 3.7405921928238787e-06, "loss": 0.4289, "step": 11737 }, { "epoch": 2.17, "learning_rate": 3.739034563558095e-06, "loss": 0.4129, "step": 11738 }, { "epoch": 2.17, "learning_rate": 3.7374771840932376e-06, "loss": 0.4355, "step": 11739 }, { "epoch": 2.17, "learning_rate": 3.7359200544914487e-06, "loss": 0.4161, "step": 11740 }, { "epoch": 2.17, "learning_rate": 3.7343631748148523e-06, "loss": 0.4428, "step": 11741 }, { "epoch": 2.17, "learning_rate": 3.732806545125561e-06, "loss": 0.425, "step": 11742 }, { "epoch": 2.17, "learning_rate": 3.7312501654856892e-06, "loss": 0.4267, "step": 11743 }, { "epoch": 2.17, "learning_rate": 3.7296940359573252e-06, "loss": 0.4147, "step": 11744 }, { "epoch": 2.17, "learning_rate": 3.7281381566025643e-06, "loss": 0.4263, "step": 11745 }, { "epoch": 2.17, "learning_rate": 3.7265825274834786e-06, "loss": 0.3973, "step": 11746 }, { "epoch": 2.17, "learning_rate": 3.7250271486621313e-06, "loss": 0.4131, "step": 11747 }, { "epoch": 2.17, "learning_rate": 3.723472020200587e-06, "loss": 0.4419, "step": 11748 }, { "epoch": 2.17, "learning_rate": 3.7219171421608846e-06, "loss": 0.4155, "step": 11749 }, { "epoch": 2.17, "learning_rate": 3.720362514605068e-06, "loss": 0.4129, "step": 11750 }, { "epoch": 2.17, "learning_rate": 3.718808137595158e-06, "loss": 0.4187, "step": 11751 }, { "epoch": 2.17, "learning_rate": 3.7172540111931766e-06, "loss": 0.4088, "step": 11752 }, { "epoch": 2.17, "learning_rate": 3.7157001354611243e-06, "loss": 0.4122, "step": 11753 }, { "epoch": 2.17, "learning_rate": 3.7141465104610054e-06, "loss": 0.4023, "step": 11754 }, { "epoch": 2.17, "learning_rate": 3.7125931362547997e-06, "loss": 0.4299, "step": 11755 }, { "epoch": 2.18, "learning_rate": 3.7110400129044897e-06, "loss": 0.4189, "step": 11756 }, { "epoch": 2.18, "learning_rate": 3.709487140472037e-06, "loss": 0.4187, "step": 11757 }, { "epoch": 2.18, "learning_rate": 3.707934519019404e-06, "loss": 0.4222, "step": 11758 }, { "epoch": 2.18, "learning_rate": 3.7063821486085303e-06, "loss": 0.4188, "step": 11759 }, { "epoch": 2.18, "learning_rate": 3.7048300293013596e-06, "loss": 0.4285, "step": 11760 }, { "epoch": 2.18, "learning_rate": 3.7032781611598136e-06, "loss": 0.4032, "step": 11761 }, { "epoch": 2.18, "learning_rate": 3.701726544245813e-06, "loss": 0.4165, "step": 11762 }, { "epoch": 2.18, "learning_rate": 3.7001751786212624e-06, "loss": 0.4303, "step": 11763 }, { "epoch": 2.18, "learning_rate": 3.6986240643480552e-06, "loss": 0.419, "step": 11764 }, { "epoch": 2.18, "learning_rate": 3.697073201488085e-06, "loss": 0.4175, "step": 11765 }, { "epoch": 2.18, "learning_rate": 3.695522590103221e-06, "loss": 0.4143, "step": 11766 }, { "epoch": 2.18, "learning_rate": 3.693972230255336e-06, "loss": 0.4139, "step": 11767 }, { "epoch": 2.18, "learning_rate": 3.6924221220062837e-06, "loss": 0.4148, "step": 11768 }, { "epoch": 2.18, "learning_rate": 3.6908722654179085e-06, "loss": 0.4158, "step": 11769 }, { "epoch": 2.18, "learning_rate": 3.6893226605520516e-06, "loss": 0.4116, "step": 11770 }, { "epoch": 2.18, "learning_rate": 3.6877733074705322e-06, "loss": 0.4239, "step": 11771 }, { "epoch": 2.18, "learning_rate": 3.686224206235176e-06, "loss": 0.4104, "step": 11772 }, { "epoch": 2.18, "learning_rate": 3.684675356907783e-06, "loss": 0.3844, "step": 11773 }, { "epoch": 2.18, "learning_rate": 3.6831267595501485e-06, "loss": 0.4269, "step": 11774 }, { "epoch": 2.18, "learning_rate": 3.681578414224063e-06, "loss": 0.4169, "step": 11775 }, { "epoch": 2.18, "learning_rate": 3.680030320991298e-06, "loss": 0.3971, "step": 11776 }, { "epoch": 2.18, "learning_rate": 3.6784824799136255e-06, "loss": 0.4085, "step": 11777 }, { "epoch": 2.18, "learning_rate": 3.676934891052798e-06, "loss": 0.4187, "step": 11778 }, { "epoch": 2.18, "learning_rate": 3.6753875544705577e-06, "loss": 0.418, "step": 11779 }, { "epoch": 2.18, "learning_rate": 3.673840470228648e-06, "loss": 0.4014, "step": 11780 }, { "epoch": 2.18, "learning_rate": 3.6722936383887877e-06, "loss": 0.4143, "step": 11781 }, { "epoch": 2.18, "learning_rate": 3.670747059012699e-06, "loss": 0.4025, "step": 11782 }, { "epoch": 2.18, "learning_rate": 3.6692007321620815e-06, "loss": 0.414, "step": 11783 }, { "epoch": 2.18, "learning_rate": 3.667654657898636e-06, "loss": 0.4126, "step": 11784 }, { "epoch": 2.18, "learning_rate": 3.666108836284047e-06, "loss": 0.4229, "step": 11785 }, { "epoch": 2.18, "learning_rate": 3.6645632673799835e-06, "loss": 0.4188, "step": 11786 }, { "epoch": 2.18, "learning_rate": 3.66301795124812e-06, "loss": 0.4238, "step": 11787 }, { "epoch": 2.18, "learning_rate": 3.661472887950105e-06, "loss": 0.4285, "step": 11788 }, { "epoch": 2.18, "learning_rate": 3.6599280775475886e-06, "loss": 0.4454, "step": 11789 }, { "epoch": 2.18, "learning_rate": 3.6583835201022046e-06, "loss": 0.4305, "step": 11790 }, { "epoch": 2.18, "learning_rate": 3.6568392156755727e-06, "loss": 0.4148, "step": 11791 }, { "epoch": 2.18, "learning_rate": 3.6552951643293156e-06, "loss": 0.4305, "step": 11792 }, { "epoch": 2.18, "learning_rate": 3.6537513661250314e-06, "loss": 0.3994, "step": 11793 }, { "epoch": 2.18, "learning_rate": 3.6522078211243206e-06, "loss": 0.4162, "step": 11794 }, { "epoch": 2.18, "learning_rate": 3.6506645293887653e-06, "loss": 0.4039, "step": 11795 }, { "epoch": 2.18, "learning_rate": 3.649121490979937e-06, "loss": 0.4213, "step": 11796 }, { "epoch": 2.18, "learning_rate": 3.647578705959406e-06, "loss": 0.4001, "step": 11797 }, { "epoch": 2.18, "learning_rate": 3.646036174388721e-06, "loss": 0.4163, "step": 11798 }, { "epoch": 2.18, "learning_rate": 3.644493896329431e-06, "loss": 0.4405, "step": 11799 }, { "epoch": 2.18, "learning_rate": 3.6429518718430634e-06, "loss": 0.4039, "step": 11800 }, { "epoch": 2.18, "learning_rate": 3.6414101009911507e-06, "loss": 0.4237, "step": 11801 }, { "epoch": 2.18, "learning_rate": 3.6398685838351988e-06, "loss": 0.4254, "step": 11802 }, { "epoch": 2.18, "learning_rate": 3.6383273204367187e-06, "loss": 0.3994, "step": 11803 }, { "epoch": 2.18, "learning_rate": 3.6367863108571967e-06, "loss": 0.421, "step": 11804 }, { "epoch": 2.18, "learning_rate": 3.635245555158122e-06, "loss": 0.4195, "step": 11805 }, { "epoch": 2.18, "learning_rate": 3.6337050534009643e-06, "loss": 0.4177, "step": 11806 }, { "epoch": 2.18, "learning_rate": 3.63216480564719e-06, "loss": 0.4238, "step": 11807 }, { "epoch": 2.18, "learning_rate": 3.6306248119582466e-06, "loss": 0.3991, "step": 11808 }, { "epoch": 2.18, "learning_rate": 3.629085072395585e-06, "loss": 0.44, "step": 11809 }, { "epoch": 2.19, "learning_rate": 3.6275455870206298e-06, "loss": 0.4202, "step": 11810 }, { "epoch": 2.19, "learning_rate": 3.626006355894811e-06, "loss": 0.4255, "step": 11811 }, { "epoch": 2.19, "learning_rate": 3.624467379079537e-06, "loss": 0.402, "step": 11812 }, { "epoch": 2.19, "learning_rate": 3.6229286566362076e-06, "loss": 0.4055, "step": 11813 }, { "epoch": 2.19, "learning_rate": 3.6213901886262214e-06, "loss": 0.4311, "step": 11814 }, { "epoch": 2.19, "learning_rate": 3.619851975110953e-06, "loss": 0.4373, "step": 11815 }, { "epoch": 2.19, "learning_rate": 3.6183140161517817e-06, "loss": 0.4075, "step": 11816 }, { "epoch": 2.19, "learning_rate": 3.6167763118100663e-06, "loss": 0.4226, "step": 11817 }, { "epoch": 2.19, "learning_rate": 3.6152388621471545e-06, "loss": 0.4051, "step": 11818 }, { "epoch": 2.19, "learning_rate": 3.613701667224394e-06, "loss": 0.3925, "step": 11819 }, { "epoch": 2.19, "learning_rate": 3.61216472710311e-06, "loss": 0.399, "step": 11820 }, { "epoch": 2.19, "learning_rate": 3.6106280418446292e-06, "loss": 0.4141, "step": 11821 }, { "epoch": 2.19, "learning_rate": 3.6090916115102616e-06, "loss": 0.3878, "step": 11822 }, { "epoch": 2.19, "learning_rate": 3.607555436161302e-06, "loss": 0.4127, "step": 11823 }, { "epoch": 2.19, "learning_rate": 3.606019515859048e-06, "loss": 0.4335, "step": 11824 }, { "epoch": 2.19, "learning_rate": 3.604483850664774e-06, "loss": 0.4292, "step": 11825 }, { "epoch": 2.19, "learning_rate": 3.6029484406397574e-06, "loss": 0.3975, "step": 11826 }, { "epoch": 2.19, "learning_rate": 3.60141328584525e-06, "loss": 0.4131, "step": 11827 }, { "epoch": 2.19, "learning_rate": 3.5998783863425103e-06, "loss": 0.4183, "step": 11828 }, { "epoch": 2.19, "learning_rate": 3.5983437421927724e-06, "loss": 0.4264, "step": 11829 }, { "epoch": 2.19, "learning_rate": 3.5968093534572635e-06, "loss": 0.4256, "step": 11830 }, { "epoch": 2.19, "learning_rate": 3.5952752201972096e-06, "loss": 0.4042, "step": 11831 }, { "epoch": 2.19, "learning_rate": 3.5937413424738144e-06, "loss": 0.4119, "step": 11832 }, { "epoch": 2.19, "learning_rate": 3.5922077203482806e-06, "loss": 0.4393, "step": 11833 }, { "epoch": 2.19, "learning_rate": 3.590674353881796e-06, "loss": 0.4209, "step": 11834 }, { "epoch": 2.19, "learning_rate": 3.589141243135533e-06, "loss": 0.4196, "step": 11835 }, { "epoch": 2.19, "learning_rate": 3.58760838817067e-06, "loss": 0.4177, "step": 11836 }, { "epoch": 2.19, "learning_rate": 3.5860757890483567e-06, "loss": 0.3904, "step": 11837 }, { "epoch": 2.19, "learning_rate": 3.584543445829748e-06, "loss": 0.4122, "step": 11838 }, { "epoch": 2.19, "learning_rate": 3.5830113585759762e-06, "loss": 0.4234, "step": 11839 }, { "epoch": 2.19, "learning_rate": 3.5814795273481685e-06, "loss": 0.4133, "step": 11840 }, { "epoch": 2.19, "learning_rate": 3.579947952207448e-06, "loss": 0.4286, "step": 11841 }, { "epoch": 2.19, "learning_rate": 3.578416633214913e-06, "loss": 0.4043, "step": 11842 }, { "epoch": 2.19, "learning_rate": 3.5768855704316687e-06, "loss": 0.4187, "step": 11843 }, { "epoch": 2.19, "learning_rate": 3.575354763918799e-06, "loss": 0.4134, "step": 11844 }, { "epoch": 2.19, "learning_rate": 3.573824213737375e-06, "loss": 0.4301, "step": 11845 }, { "epoch": 2.19, "learning_rate": 3.572293919948471e-06, "loss": 0.401, "step": 11846 }, { "epoch": 2.19, "learning_rate": 3.570763882613135e-06, "loss": 0.4107, "step": 11847 }, { "epoch": 2.19, "learning_rate": 3.5692341017924205e-06, "loss": 0.4273, "step": 11848 }, { "epoch": 2.19, "learning_rate": 3.5677045775473562e-06, "loss": 0.4175, "step": 11849 }, { "epoch": 2.19, "learning_rate": 3.566175309938973e-06, "loss": 0.3962, "step": 11850 }, { "epoch": 2.19, "learning_rate": 3.564646299028279e-06, "loss": 0.3964, "step": 11851 }, { "epoch": 2.19, "learning_rate": 3.5631175448762877e-06, "loss": 0.4, "step": 11852 }, { "epoch": 2.19, "learning_rate": 3.561589047543984e-06, "loss": 0.4156, "step": 11853 }, { "epoch": 2.19, "learning_rate": 3.5600608070923616e-06, "loss": 0.4232, "step": 11854 }, { "epoch": 2.19, "learning_rate": 3.5585328235823856e-06, "loss": 0.4136, "step": 11855 }, { "epoch": 2.19, "learning_rate": 3.5570050970750282e-06, "loss": 0.3999, "step": 11856 }, { "epoch": 2.19, "learning_rate": 3.5554776276312343e-06, "loss": 0.4186, "step": 11857 }, { "epoch": 2.19, "learning_rate": 3.553950415311954e-06, "loss": 0.4143, "step": 11858 }, { "epoch": 2.19, "learning_rate": 3.552423460178116e-06, "loss": 0.429, "step": 11859 }, { "epoch": 2.19, "learning_rate": 3.5508967622906463e-06, "loss": 0.4097, "step": 11860 }, { "epoch": 2.19, "learning_rate": 3.549370321710457e-06, "loss": 0.429, "step": 11861 }, { "epoch": 2.19, "learning_rate": 3.547844138498444e-06, "loss": 0.4144, "step": 11862 }, { "epoch": 2.19, "learning_rate": 3.5463182127155085e-06, "loss": 0.4195, "step": 11863 }, { "epoch": 2.2, "learning_rate": 3.544792544422524e-06, "loss": 0.4303, "step": 11864 }, { "epoch": 2.2, "learning_rate": 3.5432671336803683e-06, "loss": 0.4129, "step": 11865 }, { "epoch": 2.2, "learning_rate": 3.541741980549901e-06, "loss": 0.4189, "step": 11866 }, { "epoch": 2.2, "learning_rate": 3.540217085091967e-06, "loss": 0.4133, "step": 11867 }, { "epoch": 2.2, "learning_rate": 3.5386924473674144e-06, "loss": 0.4038, "step": 11868 }, { "epoch": 2.2, "learning_rate": 3.537168067437068e-06, "loss": 0.4314, "step": 11869 }, { "epoch": 2.2, "learning_rate": 3.535643945361753e-06, "loss": 0.4227, "step": 11870 }, { "epoch": 2.2, "learning_rate": 3.5341200812022724e-06, "loss": 0.4228, "step": 11871 }, { "epoch": 2.2, "learning_rate": 3.532596475019433e-06, "loss": 0.4002, "step": 11872 }, { "epoch": 2.2, "learning_rate": 3.5310731268740208e-06, "loss": 0.4128, "step": 11873 }, { "epoch": 2.2, "learning_rate": 3.5295500368268097e-06, "loss": 0.4199, "step": 11874 }, { "epoch": 2.2, "learning_rate": 3.528027204938577e-06, "loss": 0.4091, "step": 11875 }, { "epoch": 2.2, "learning_rate": 3.5265046312700714e-06, "loss": 0.4276, "step": 11876 }, { "epoch": 2.2, "learning_rate": 3.5249823158820493e-06, "loss": 0.4135, "step": 11877 }, { "epoch": 2.2, "learning_rate": 3.523460258835245e-06, "loss": 0.406, "step": 11878 }, { "epoch": 2.2, "learning_rate": 3.5219384601903815e-06, "loss": 0.418, "step": 11879 }, { "epoch": 2.2, "learning_rate": 3.5204169200081838e-06, "loss": 0.4159, "step": 11880 }, { "epoch": 2.2, "learning_rate": 3.518895638349351e-06, "loss": 0.4155, "step": 11881 }, { "epoch": 2.2, "learning_rate": 3.517374615274586e-06, "loss": 0.4138, "step": 11882 }, { "epoch": 2.2, "learning_rate": 3.5158538508445716e-06, "loss": 0.4097, "step": 11883 }, { "epoch": 2.2, "learning_rate": 3.514333345119979e-06, "loss": 0.4145, "step": 11884 }, { "epoch": 2.2, "learning_rate": 3.512813098161483e-06, "loss": 0.4211, "step": 11885 }, { "epoch": 2.2, "learning_rate": 3.51129311002973e-06, "loss": 0.4386, "step": 11886 }, { "epoch": 2.2, "learning_rate": 3.5097733807853705e-06, "loss": 0.405, "step": 11887 }, { "epoch": 2.2, "learning_rate": 3.5082539104890377e-06, "loss": 0.3963, "step": 11888 }, { "epoch": 2.2, "learning_rate": 3.5067346992013516e-06, "loss": 0.4189, "step": 11889 }, { "epoch": 2.2, "learning_rate": 3.505215746982932e-06, "loss": 0.4602, "step": 11890 }, { "epoch": 2.2, "learning_rate": 3.503697053894376e-06, "loss": 0.4141, "step": 11891 }, { "epoch": 2.2, "learning_rate": 3.5021786199962837e-06, "loss": 0.4357, "step": 11892 }, { "epoch": 2.2, "learning_rate": 3.5006604453492298e-06, "loss": 0.4294, "step": 11893 }, { "epoch": 2.2, "learning_rate": 3.4991425300137948e-06, "loss": 0.4087, "step": 11894 }, { "epoch": 2.2, "learning_rate": 3.497624874050537e-06, "loss": 0.4421, "step": 11895 }, { "epoch": 2.2, "learning_rate": 3.4961074775200056e-06, "loss": 0.4118, "step": 11896 }, { "epoch": 2.2, "learning_rate": 3.4945903404827453e-06, "loss": 0.4095, "step": 11897 }, { "epoch": 2.2, "learning_rate": 3.4930734629992847e-06, "loss": 0.4345, "step": 11898 }, { "epoch": 2.2, "learning_rate": 3.4915568451301473e-06, "loss": 0.403, "step": 11899 }, { "epoch": 2.2, "learning_rate": 3.490040486935843e-06, "loss": 0.4246, "step": 11900 }, { "epoch": 2.2, "learning_rate": 3.488524388476866e-06, "loss": 0.4174, "step": 11901 }, { "epoch": 2.2, "learning_rate": 3.487008549813714e-06, "loss": 0.415, "step": 11902 }, { "epoch": 2.2, "learning_rate": 3.4854929710068596e-06, "loss": 0.4301, "step": 11903 }, { "epoch": 2.2, "learning_rate": 3.483977652116777e-06, "loss": 0.4256, "step": 11904 }, { "epoch": 2.2, "learning_rate": 3.482462593203919e-06, "loss": 0.395, "step": 11905 }, { "epoch": 2.2, "learning_rate": 3.4809477943287394e-06, "loss": 0.4107, "step": 11906 }, { "epoch": 2.2, "learning_rate": 3.4794332555516706e-06, "loss": 0.3881, "step": 11907 }, { "epoch": 2.2, "learning_rate": 3.4779189769331457e-06, "loss": 0.4215, "step": 11908 }, { "epoch": 2.2, "learning_rate": 3.4764049585335747e-06, "loss": 0.4162, "step": 11909 }, { "epoch": 2.2, "learning_rate": 3.4748912004133705e-06, "loss": 0.4308, "step": 11910 }, { "epoch": 2.2, "learning_rate": 3.473377702632924e-06, "loss": 0.4296, "step": 11911 }, { "epoch": 2.2, "learning_rate": 3.4718644652526266e-06, "loss": 0.4203, "step": 11912 }, { "epoch": 2.2, "learning_rate": 3.470351488332847e-06, "loss": 0.4239, "step": 11913 }, { "epoch": 2.2, "learning_rate": 3.4688387719339566e-06, "loss": 0.4115, "step": 11914 }, { "epoch": 2.2, "learning_rate": 3.4673263161163052e-06, "loss": 0.4212, "step": 11915 }, { "epoch": 2.2, "learning_rate": 3.4658141209402408e-06, "loss": 0.3988, "step": 11916 }, { "epoch": 2.2, "learning_rate": 3.4643021864660952e-06, "loss": 0.413, "step": 11917 }, { "epoch": 2.2, "learning_rate": 3.4627905127541892e-06, "loss": 0.4003, "step": 11918 }, { "epoch": 2.21, "learning_rate": 3.4612790998648417e-06, "loss": 0.4122, "step": 11919 }, { "epoch": 2.21, "learning_rate": 3.459767947858348e-06, "loss": 0.4288, "step": 11920 }, { "epoch": 2.21, "learning_rate": 3.458257056795008e-06, "loss": 0.4092, "step": 11921 }, { "epoch": 2.21, "learning_rate": 3.4567464267351004e-06, "loss": 0.4197, "step": 11922 }, { "epoch": 2.21, "learning_rate": 3.455236057738892e-06, "loss": 0.4204, "step": 11923 }, { "epoch": 2.21, "learning_rate": 3.4537259498666507e-06, "loss": 0.4093, "step": 11924 }, { "epoch": 2.21, "learning_rate": 3.4522161031786204e-06, "loss": 0.4129, "step": 11925 }, { "epoch": 2.21, "learning_rate": 3.4507065177350485e-06, "loss": 0.4198, "step": 11926 }, { "epoch": 2.21, "learning_rate": 3.449197193596161e-06, "loss": 0.4275, "step": 11927 }, { "epoch": 2.21, "learning_rate": 3.4476881308221733e-06, "loss": 0.4073, "step": 11928 }, { "epoch": 2.21, "learning_rate": 3.4461793294733013e-06, "loss": 0.4405, "step": 11929 }, { "epoch": 2.21, "learning_rate": 3.4446707896097363e-06, "loss": 0.4079, "step": 11930 }, { "epoch": 2.21, "learning_rate": 3.4431625112916732e-06, "loss": 0.4238, "step": 11931 }, { "epoch": 2.21, "learning_rate": 3.4416544945792874e-06, "loss": 0.4341, "step": 11932 }, { "epoch": 2.21, "learning_rate": 3.4401467395327402e-06, "loss": 0.3982, "step": 11933 }, { "epoch": 2.21, "learning_rate": 3.4386392462121964e-06, "loss": 0.4141, "step": 11934 }, { "epoch": 2.21, "learning_rate": 3.4371320146777953e-06, "loss": 0.41, "step": 11935 }, { "epoch": 2.21, "learning_rate": 3.43562504498968e-06, "loss": 0.3944, "step": 11936 }, { "epoch": 2.21, "learning_rate": 3.434118337207968e-06, "loss": 0.4344, "step": 11937 }, { "epoch": 2.21, "learning_rate": 3.432611891392782e-06, "loss": 0.4127, "step": 11938 }, { "epoch": 2.21, "learning_rate": 3.431105707604221e-06, "loss": 0.4076, "step": 11939 }, { "epoch": 2.21, "learning_rate": 3.4295997859023778e-06, "loss": 0.4218, "step": 11940 }, { "epoch": 2.21, "learning_rate": 3.428094126347341e-06, "loss": 0.4118, "step": 11941 }, { "epoch": 2.21, "learning_rate": 3.4265887289991784e-06, "loss": 0.443, "step": 11942 }, { "epoch": 2.21, "learning_rate": 3.425083593917958e-06, "loss": 0.4048, "step": 11943 }, { "epoch": 2.21, "learning_rate": 3.4235787211637293e-06, "loss": 0.4207, "step": 11944 }, { "epoch": 2.21, "learning_rate": 3.4220741107965304e-06, "loss": 0.4083, "step": 11945 }, { "epoch": 2.21, "learning_rate": 3.4205697628764e-06, "loss": 0.4199, "step": 11946 }, { "epoch": 2.21, "learning_rate": 3.4190656774633502e-06, "loss": 0.4191, "step": 11947 }, { "epoch": 2.21, "learning_rate": 3.4175618546173994e-06, "loss": 0.4368, "step": 11948 }, { "epoch": 2.21, "learning_rate": 3.4160582943985433e-06, "loss": 0.4025, "step": 11949 }, { "epoch": 2.21, "learning_rate": 3.414554996866768e-06, "loss": 0.4202, "step": 11950 }, { "epoch": 2.21, "learning_rate": 3.413051962082059e-06, "loss": 0.4275, "step": 11951 }, { "epoch": 2.21, "learning_rate": 3.4115491901043775e-06, "loss": 0.4303, "step": 11952 }, { "epoch": 2.21, "learning_rate": 3.4100466809936894e-06, "loss": 0.4224, "step": 11953 }, { "epoch": 2.21, "learning_rate": 3.408544434809934e-06, "loss": 0.4245, "step": 11954 }, { "epoch": 2.21, "learning_rate": 3.407042451613055e-06, "loss": 0.3997, "step": 11955 }, { "epoch": 2.21, "learning_rate": 3.405540731462973e-06, "loss": 0.4225, "step": 11956 }, { "epoch": 2.21, "learning_rate": 3.404039274419608e-06, "loss": 0.4114, "step": 11957 }, { "epoch": 2.21, "learning_rate": 3.402538080542863e-06, "loss": 0.4321, "step": 11958 }, { "epoch": 2.21, "learning_rate": 3.401037149892635e-06, "loss": 0.4139, "step": 11959 }, { "epoch": 2.21, "learning_rate": 3.399536482528806e-06, "loss": 0.41, "step": 11960 }, { "epoch": 2.21, "learning_rate": 3.398036078511252e-06, "loss": 0.4157, "step": 11961 }, { "epoch": 2.21, "learning_rate": 3.396535937899833e-06, "loss": 0.4233, "step": 11962 }, { "epoch": 2.21, "learning_rate": 3.3950360607544074e-06, "loss": 0.403, "step": 11963 }, { "epoch": 2.21, "learning_rate": 3.3935364471348108e-06, "loss": 0.4312, "step": 11964 }, { "epoch": 2.21, "learning_rate": 3.392037097100881e-06, "loss": 0.4043, "step": 11965 }, { "epoch": 2.21, "learning_rate": 3.3905380107124373e-06, "loss": 0.3923, "step": 11966 }, { "epoch": 2.21, "learning_rate": 3.3890391880292874e-06, "loss": 0.42, "step": 11967 }, { "epoch": 2.21, "learning_rate": 3.3875406291112367e-06, "loss": 0.4243, "step": 11968 }, { "epoch": 2.21, "learning_rate": 3.386042334018068e-06, "loss": 0.4171, "step": 11969 }, { "epoch": 2.21, "learning_rate": 3.3845443028095695e-06, "loss": 0.4092, "step": 11970 }, { "epoch": 2.21, "learning_rate": 3.3830465355455044e-06, "loss": 0.4032, "step": 11971 }, { "epoch": 2.21, "learning_rate": 3.381549032285628e-06, "loss": 0.4156, "step": 11972 }, { "epoch": 2.22, "learning_rate": 3.3800517930896957e-06, "loss": 0.4379, "step": 11973 }, { "epoch": 2.22, "learning_rate": 3.3785548180174365e-06, "loss": 0.4245, "step": 11974 }, { "epoch": 2.22, "learning_rate": 3.3770581071285834e-06, "loss": 0.4225, "step": 11975 }, { "epoch": 2.22, "learning_rate": 3.3755616604828513e-06, "loss": 0.4265, "step": 11976 }, { "epoch": 2.22, "learning_rate": 3.3740654781399395e-06, "loss": 0.4364, "step": 11977 }, { "epoch": 2.22, "learning_rate": 3.372569560159552e-06, "loss": 0.4145, "step": 11978 }, { "epoch": 2.22, "learning_rate": 3.3710739066013644e-06, "loss": 0.4214, "step": 11979 }, { "epoch": 2.22, "learning_rate": 3.3695785175250586e-06, "loss": 0.4294, "step": 11980 }, { "epoch": 2.22, "learning_rate": 3.368083392990293e-06, "loss": 0.3708, "step": 11981 }, { "epoch": 2.22, "learning_rate": 3.3665885330567193e-06, "loss": 0.4272, "step": 11982 }, { "epoch": 2.22, "learning_rate": 3.3650939377839854e-06, "loss": 0.4142, "step": 11983 }, { "epoch": 2.22, "learning_rate": 3.3635996072317146e-06, "loss": 0.4092, "step": 11984 }, { "epoch": 2.22, "learning_rate": 3.362105541459536e-06, "loss": 0.4177, "step": 11985 }, { "epoch": 2.22, "learning_rate": 3.3606117405270534e-06, "loss": 0.4171, "step": 11986 }, { "epoch": 2.22, "learning_rate": 3.359118204493874e-06, "loss": 0.4199, "step": 11987 }, { "epoch": 2.22, "learning_rate": 3.357624933419582e-06, "loss": 0.4066, "step": 11988 }, { "epoch": 2.22, "learning_rate": 3.356131927363754e-06, "loss": 0.4238, "step": 11989 }, { "epoch": 2.22, "learning_rate": 3.354639186385965e-06, "loss": 0.4398, "step": 11990 }, { "epoch": 2.22, "learning_rate": 3.353146710545765e-06, "loss": 0.3972, "step": 11991 }, { "epoch": 2.22, "learning_rate": 3.351654499902709e-06, "loss": 0.411, "step": 11992 }, { "epoch": 2.22, "learning_rate": 3.3501625545163284e-06, "loss": 0.4414, "step": 11993 }, { "epoch": 2.22, "learning_rate": 3.3486708744461473e-06, "loss": 0.4119, "step": 11994 }, { "epoch": 2.22, "learning_rate": 3.347179459751687e-06, "loss": 0.3972, "step": 11995 }, { "epoch": 2.22, "learning_rate": 3.345688310492445e-06, "loss": 0.4178, "step": 11996 }, { "epoch": 2.22, "learning_rate": 3.3441974267279243e-06, "loss": 0.42, "step": 11997 }, { "epoch": 2.22, "learning_rate": 3.342706808517602e-06, "loss": 0.4391, "step": 11998 }, { "epoch": 2.22, "learning_rate": 3.3412164559209492e-06, "loss": 0.4123, "step": 11999 }, { "epoch": 2.22, "learning_rate": 3.3397263689974346e-06, "loss": 0.4103, "step": 12000 }, { "epoch": 2.22, "learning_rate": 3.338236547806504e-06, "loss": 0.4147, "step": 12001 }, { "epoch": 2.22, "learning_rate": 3.3367469924076036e-06, "loss": 0.4138, "step": 12002 }, { "epoch": 2.22, "learning_rate": 3.3352577028601583e-06, "loss": 0.4103, "step": 12003 }, { "epoch": 2.22, "learning_rate": 3.3337686792235957e-06, "loss": 0.4193, "step": 12004 }, { "epoch": 2.22, "learning_rate": 3.3322799215573165e-06, "loss": 0.4165, "step": 12005 }, { "epoch": 2.22, "learning_rate": 3.3307914299207266e-06, "loss": 0.4104, "step": 12006 }, { "epoch": 2.22, "learning_rate": 3.3293032043732076e-06, "loss": 0.4168, "step": 12007 }, { "epoch": 2.22, "learning_rate": 3.327815244974144e-06, "loss": 0.4259, "step": 12008 }, { "epoch": 2.22, "learning_rate": 3.326327551782895e-06, "loss": 0.4252, "step": 12009 }, { "epoch": 2.22, "learning_rate": 3.3248401248588247e-06, "loss": 0.4313, "step": 12010 }, { "epoch": 2.22, "learning_rate": 3.323352964261272e-06, "loss": 0.4411, "step": 12011 }, { "epoch": 2.22, "learning_rate": 3.3218660700495763e-06, "loss": 0.4244, "step": 12012 }, { "epoch": 2.22, "learning_rate": 3.3203794422830583e-06, "loss": 0.4258, "step": 12013 }, { "epoch": 2.22, "learning_rate": 3.3188930810210364e-06, "loss": 0.4188, "step": 12014 }, { "epoch": 2.22, "learning_rate": 3.3174069863228097e-06, "loss": 0.4056, "step": 12015 }, { "epoch": 2.22, "learning_rate": 3.3159211582476692e-06, "loss": 0.4256, "step": 12016 }, { "epoch": 2.22, "learning_rate": 3.3144355968549027e-06, "loss": 0.4139, "step": 12017 }, { "epoch": 2.22, "learning_rate": 3.3129503022037748e-06, "loss": 0.3985, "step": 12018 }, { "epoch": 2.22, "learning_rate": 3.3114652743535524e-06, "loss": 0.3932, "step": 12019 }, { "epoch": 2.22, "learning_rate": 3.309980513363481e-06, "loss": 0.4256, "step": 12020 }, { "epoch": 2.22, "learning_rate": 3.3084960192927984e-06, "loss": 0.4228, "step": 12021 }, { "epoch": 2.22, "learning_rate": 3.3070117922007395e-06, "loss": 0.4086, "step": 12022 }, { "epoch": 2.22, "learning_rate": 3.3055278321465144e-06, "loss": 0.42, "step": 12023 }, { "epoch": 2.22, "learning_rate": 3.3040441391893375e-06, "loss": 0.4208, "step": 12024 }, { "epoch": 2.22, "learning_rate": 3.302560713388403e-06, "loss": 0.413, "step": 12025 }, { "epoch": 2.22, "learning_rate": 3.3010775548028917e-06, "loss": 0.4279, "step": 12026 }, { "epoch": 2.23, "learning_rate": 3.299594663491987e-06, "loss": 0.4059, "step": 12027 }, { "epoch": 2.23, "learning_rate": 3.298112039514847e-06, "loss": 0.4247, "step": 12028 }, { "epoch": 2.23, "learning_rate": 3.296629682930631e-06, "loss": 0.4374, "step": 12029 }, { "epoch": 2.23, "learning_rate": 3.2951475937984765e-06, "loss": 0.4436, "step": 12030 }, { "epoch": 2.23, "learning_rate": 3.2936657721775223e-06, "loss": 0.4169, "step": 12031 }, { "epoch": 2.23, "learning_rate": 3.2921842181268882e-06, "loss": 0.4241, "step": 12032 }, { "epoch": 2.23, "learning_rate": 3.2907029317056803e-06, "loss": 0.4133, "step": 12033 }, { "epoch": 2.23, "learning_rate": 3.2892219129730076e-06, "loss": 0.4274, "step": 12034 }, { "epoch": 2.23, "learning_rate": 3.2877411619879517e-06, "loss": 0.4204, "step": 12035 }, { "epoch": 2.23, "learning_rate": 3.286260678809601e-06, "loss": 0.4057, "step": 12036 }, { "epoch": 2.23, "learning_rate": 3.284780463497017e-06, "loss": 0.4296, "step": 12037 }, { "epoch": 2.23, "learning_rate": 3.283300516109258e-06, "loss": 0.4236, "step": 12038 }, { "epoch": 2.23, "learning_rate": 3.281820836705375e-06, "loss": 0.4299, "step": 12039 }, { "epoch": 2.23, "learning_rate": 3.280341425344399e-06, "loss": 0.419, "step": 12040 }, { "epoch": 2.23, "learning_rate": 3.2788622820853634e-06, "loss": 0.4059, "step": 12041 }, { "epoch": 2.23, "learning_rate": 3.2773834069872778e-06, "loss": 0.4282, "step": 12042 }, { "epoch": 2.23, "learning_rate": 3.2759048001091443e-06, "loss": 0.4387, "step": 12043 }, { "epoch": 2.23, "learning_rate": 3.2744264615099643e-06, "loss": 0.404, "step": 12044 }, { "epoch": 2.23, "learning_rate": 3.2729483912487112e-06, "loss": 0.4248, "step": 12045 }, { "epoch": 2.23, "learning_rate": 3.2714705893843677e-06, "loss": 0.4416, "step": 12046 }, { "epoch": 2.23, "learning_rate": 3.26999305597589e-06, "loss": 0.4386, "step": 12047 }, { "epoch": 2.23, "learning_rate": 3.2685157910822252e-06, "loss": 0.4121, "step": 12048 }, { "epoch": 2.23, "learning_rate": 3.2670387947623205e-06, "loss": 0.3943, "step": 12049 }, { "epoch": 2.23, "learning_rate": 3.2655620670750986e-06, "loss": 0.4133, "step": 12050 }, { "epoch": 2.23, "learning_rate": 3.2640856080794857e-06, "loss": 0.4109, "step": 12051 }, { "epoch": 2.23, "learning_rate": 3.2626094178343826e-06, "loss": 0.4198, "step": 12052 }, { "epoch": 2.23, "learning_rate": 3.261133496398692e-06, "loss": 0.4324, "step": 12053 }, { "epoch": 2.23, "learning_rate": 3.2596578438312963e-06, "loss": 0.4184, "step": 12054 }, { "epoch": 2.23, "learning_rate": 3.258182460191075e-06, "loss": 0.4201, "step": 12055 }, { "epoch": 2.23, "learning_rate": 3.2567073455368892e-06, "loss": 0.4211, "step": 12056 }, { "epoch": 2.23, "learning_rate": 3.2552324999275985e-06, "loss": 0.4127, "step": 12057 }, { "epoch": 2.23, "learning_rate": 3.2537579234220405e-06, "loss": 0.4154, "step": 12058 }, { "epoch": 2.23, "learning_rate": 3.252283616079054e-06, "loss": 0.4045, "step": 12059 }, { "epoch": 2.23, "learning_rate": 3.2508095779574545e-06, "loss": 0.3925, "step": 12060 }, { "epoch": 2.23, "learning_rate": 3.249335809116061e-06, "loss": 0.4102, "step": 12061 }, { "epoch": 2.23, "learning_rate": 3.2478623096136663e-06, "loss": 0.4201, "step": 12062 }, { "epoch": 2.23, "learning_rate": 3.246389079509068e-06, "loss": 0.4145, "step": 12063 }, { "epoch": 2.23, "learning_rate": 3.244916118861041e-06, "loss": 0.4092, "step": 12064 }, { "epoch": 2.23, "learning_rate": 3.243443427728351e-06, "loss": 0.4124, "step": 12065 }, { "epoch": 2.23, "learning_rate": 3.241971006169763e-06, "loss": 0.4246, "step": 12066 }, { "epoch": 2.23, "learning_rate": 3.2404988542440154e-06, "loss": 0.4234, "step": 12067 }, { "epoch": 2.23, "learning_rate": 3.239026972009852e-06, "loss": 0.4199, "step": 12068 }, { "epoch": 2.23, "learning_rate": 3.2375553595259944e-06, "loss": 0.4179, "step": 12069 }, { "epoch": 2.23, "learning_rate": 3.2360840168511553e-06, "loss": 0.4269, "step": 12070 }, { "epoch": 2.23, "learning_rate": 3.2346129440440443e-06, "loss": 0.4135, "step": 12071 }, { "epoch": 2.23, "learning_rate": 3.233142141163347e-06, "loss": 0.3968, "step": 12072 }, { "epoch": 2.23, "learning_rate": 3.2316716082677533e-06, "loss": 0.4223, "step": 12073 }, { "epoch": 2.23, "learning_rate": 3.2302013454159276e-06, "loss": 0.428, "step": 12074 }, { "epoch": 2.23, "learning_rate": 3.2287313526665378e-06, "loss": 0.4041, "step": 12075 }, { "epoch": 2.23, "learning_rate": 3.22726163007823e-06, "loss": 0.4318, "step": 12076 }, { "epoch": 2.23, "learning_rate": 3.2257921777096412e-06, "loss": 0.4322, "step": 12077 }, { "epoch": 2.23, "learning_rate": 3.2243229956194054e-06, "loss": 0.4319, "step": 12078 }, { "epoch": 2.23, "learning_rate": 3.2228540838661336e-06, "loss": 0.445, "step": 12079 }, { "epoch": 2.23, "learning_rate": 3.22138544250844e-06, "loss": 0.4258, "step": 12080 }, { "epoch": 2.24, "learning_rate": 3.2199170716049167e-06, "loss": 0.4259, "step": 12081 }, { "epoch": 2.24, "learning_rate": 3.2184489712141463e-06, "loss": 0.4063, "step": 12082 }, { "epoch": 2.24, "learning_rate": 3.2169811413947093e-06, "loss": 0.4255, "step": 12083 }, { "epoch": 2.24, "learning_rate": 3.215513582205163e-06, "loss": 0.4251, "step": 12084 }, { "epoch": 2.24, "learning_rate": 3.214046293704067e-06, "loss": 0.4105, "step": 12085 }, { "epoch": 2.24, "learning_rate": 3.212579275949961e-06, "loss": 0.4087, "step": 12086 }, { "epoch": 2.24, "learning_rate": 3.21111252900137e-06, "loss": 0.4092, "step": 12087 }, { "epoch": 2.24, "learning_rate": 3.209646052916825e-06, "loss": 0.4205, "step": 12088 }, { "epoch": 2.24, "learning_rate": 3.2081798477548253e-06, "loss": 0.4281, "step": 12089 }, { "epoch": 2.24, "learning_rate": 3.20671391357388e-06, "loss": 0.405, "step": 12090 }, { "epoch": 2.24, "learning_rate": 3.205248250432471e-06, "loss": 0.4081, "step": 12091 }, { "epoch": 2.24, "learning_rate": 3.203782858389074e-06, "loss": 0.42, "step": 12092 }, { "epoch": 2.24, "learning_rate": 3.2023177375021606e-06, "loss": 0.4146, "step": 12093 }, { "epoch": 2.24, "learning_rate": 3.2008528878301812e-06, "loss": 0.4307, "step": 12094 }, { "epoch": 2.24, "learning_rate": 3.199388309431587e-06, "loss": 0.4051, "step": 12095 }, { "epoch": 2.24, "learning_rate": 3.197924002364805e-06, "loss": 0.42, "step": 12096 }, { "epoch": 2.24, "learning_rate": 3.1964599666882647e-06, "loss": 0.4279, "step": 12097 }, { "epoch": 2.24, "learning_rate": 3.194996202460374e-06, "loss": 0.4256, "step": 12098 }, { "epoch": 2.24, "learning_rate": 3.1935327097395343e-06, "loss": 0.406, "step": 12099 }, { "epoch": 2.24, "learning_rate": 3.1920694885841395e-06, "loss": 0.4257, "step": 12100 }, { "epoch": 2.24, "learning_rate": 3.1906065390525653e-06, "loss": 0.4328, "step": 12101 }, { "epoch": 2.24, "learning_rate": 3.1891438612031857e-06, "loss": 0.4196, "step": 12102 }, { "epoch": 2.24, "learning_rate": 3.1876814550943524e-06, "loss": 0.4027, "step": 12103 }, { "epoch": 2.24, "learning_rate": 3.1862193207844206e-06, "loss": 0.4292, "step": 12104 }, { "epoch": 2.24, "learning_rate": 3.1847574583317185e-06, "loss": 0.403, "step": 12105 }, { "epoch": 2.24, "learning_rate": 3.183295867794579e-06, "loss": 0.4321, "step": 12106 }, { "epoch": 2.24, "learning_rate": 3.1818345492313108e-06, "loss": 0.4119, "step": 12107 }, { "epoch": 2.24, "learning_rate": 3.180373502700224e-06, "loss": 0.407, "step": 12108 }, { "epoch": 2.24, "learning_rate": 3.178912728259603e-06, "loss": 0.4207, "step": 12109 }, { "epoch": 2.24, "learning_rate": 3.177452225967741e-06, "loss": 0.43, "step": 12110 }, { "epoch": 2.24, "learning_rate": 3.175991995882899e-06, "loss": 0.4105, "step": 12111 }, { "epoch": 2.24, "learning_rate": 3.174532038063346e-06, "loss": 0.4299, "step": 12112 }, { "epoch": 2.24, "learning_rate": 3.173072352567327e-06, "loss": 0.4204, "step": 12113 }, { "epoch": 2.24, "learning_rate": 3.171612939453079e-06, "loss": 0.4287, "step": 12114 }, { "epoch": 2.24, "learning_rate": 3.1701537987788346e-06, "loss": 0.4233, "step": 12115 }, { "epoch": 2.24, "learning_rate": 3.1686949306028057e-06, "loss": 0.417, "step": 12116 }, { "epoch": 2.24, "learning_rate": 3.1672363349832047e-06, "loss": 0.405, "step": 12117 }, { "epoch": 2.24, "learning_rate": 3.16577801197822e-06, "loss": 0.4243, "step": 12118 }, { "epoch": 2.24, "learning_rate": 3.164319961646043e-06, "loss": 0.4364, "step": 12119 }, { "epoch": 2.24, "learning_rate": 3.1628621840448426e-06, "loss": 0.4161, "step": 12120 }, { "epoch": 2.24, "learning_rate": 3.16140467923278e-06, "loss": 0.4307, "step": 12121 }, { "epoch": 2.24, "learning_rate": 3.1599474472680125e-06, "loss": 0.3896, "step": 12122 }, { "epoch": 2.24, "learning_rate": 3.1584904882086743e-06, "loss": 0.4022, "step": 12123 }, { "epoch": 2.24, "learning_rate": 3.1570338021129023e-06, "loss": 0.4295, "step": 12124 }, { "epoch": 2.24, "learning_rate": 3.155577389038813e-06, "loss": 0.4181, "step": 12125 }, { "epoch": 2.24, "learning_rate": 3.1541212490445094e-06, "loss": 0.4214, "step": 12126 }, { "epoch": 2.24, "learning_rate": 3.152665382188097e-06, "loss": 0.4107, "step": 12127 }, { "epoch": 2.24, "learning_rate": 3.151209788527655e-06, "loss": 0.409, "step": 12128 }, { "epoch": 2.24, "learning_rate": 3.1497544681212645e-06, "loss": 0.4182, "step": 12129 }, { "epoch": 2.24, "learning_rate": 3.148299421026989e-06, "loss": 0.4049, "step": 12130 }, { "epoch": 2.24, "learning_rate": 3.146844647302878e-06, "loss": 0.4204, "step": 12131 }, { "epoch": 2.24, "learning_rate": 3.145390147006979e-06, "loss": 0.3848, "step": 12132 }, { "epoch": 2.24, "learning_rate": 3.143935920197321e-06, "loss": 0.4357, "step": 12133 }, { "epoch": 2.24, "learning_rate": 3.1424819669319272e-06, "loss": 0.4, "step": 12134 }, { "epoch": 2.25, "learning_rate": 3.141028287268808e-06, "loss": 0.4155, "step": 12135 }, { "epoch": 2.25, "learning_rate": 3.1395748812659576e-06, "loss": 0.424, "step": 12136 }, { "epoch": 2.25, "learning_rate": 3.138121748981371e-06, "loss": 0.393, "step": 12137 }, { "epoch": 2.25, "learning_rate": 3.136668890473019e-06, "loss": 0.4134, "step": 12138 }, { "epoch": 2.25, "learning_rate": 3.135216305798874e-06, "loss": 0.4109, "step": 12139 }, { "epoch": 2.25, "learning_rate": 3.133763995016885e-06, "loss": 0.4127, "step": 12140 }, { "epoch": 2.25, "learning_rate": 3.1323119581850047e-06, "loss": 0.4239, "step": 12141 }, { "epoch": 2.25, "learning_rate": 3.1308601953611605e-06, "loss": 0.4093, "step": 12142 }, { "epoch": 2.25, "learning_rate": 3.1294087066032743e-06, "loss": 0.4015, "step": 12143 }, { "epoch": 2.25, "learning_rate": 3.1279574919692636e-06, "loss": 0.4503, "step": 12144 }, { "epoch": 2.25, "learning_rate": 3.1265065515170223e-06, "loss": 0.4251, "step": 12145 }, { "epoch": 2.25, "learning_rate": 3.1250558853044464e-06, "loss": 0.4269, "step": 12146 }, { "epoch": 2.25, "learning_rate": 3.1236054933894123e-06, "loss": 0.4273, "step": 12147 }, { "epoch": 2.25, "learning_rate": 3.122155375829784e-06, "loss": 0.376, "step": 12148 }, { "epoch": 2.25, "learning_rate": 3.1207055326834266e-06, "loss": 0.414, "step": 12149 }, { "epoch": 2.25, "learning_rate": 3.1192559640081775e-06, "loss": 0.41, "step": 12150 }, { "epoch": 2.25, "learning_rate": 3.11780666986188e-06, "loss": 0.435, "step": 12151 }, { "epoch": 2.25, "learning_rate": 3.116357650302354e-06, "loss": 0.4107, "step": 12152 }, { "epoch": 2.25, "learning_rate": 3.114908905387409e-06, "loss": 0.4169, "step": 12153 }, { "epoch": 2.25, "learning_rate": 3.1134604351748565e-06, "loss": 0.4104, "step": 12154 }, { "epoch": 2.25, "learning_rate": 3.1120122397224785e-06, "loss": 0.4162, "step": 12155 }, { "epoch": 2.25, "learning_rate": 3.110564319088062e-06, "loss": 0.4172, "step": 12156 }, { "epoch": 2.25, "learning_rate": 3.109116673329371e-06, "loss": 0.4208, "step": 12157 }, { "epoch": 2.25, "learning_rate": 3.1076693025041694e-06, "loss": 0.4223, "step": 12158 }, { "epoch": 2.25, "learning_rate": 3.1062222066701986e-06, "loss": 0.4132, "step": 12159 }, { "epoch": 2.25, "learning_rate": 3.1047753858852014e-06, "loss": 0.4239, "step": 12160 }, { "epoch": 2.25, "learning_rate": 3.103328840206897e-06, "loss": 0.4109, "step": 12161 }, { "epoch": 2.25, "learning_rate": 3.1018825696930064e-06, "loss": 0.4064, "step": 12162 }, { "epoch": 2.25, "learning_rate": 3.1004365744012267e-06, "loss": 0.3958, "step": 12163 }, { "epoch": 2.25, "learning_rate": 3.0989908543892565e-06, "loss": 0.4364, "step": 12164 }, { "epoch": 2.25, "learning_rate": 3.0975454097147716e-06, "loss": 0.4132, "step": 12165 }, { "epoch": 2.25, "learning_rate": 3.0961002404354477e-06, "loss": 0.4213, "step": 12166 }, { "epoch": 2.25, "learning_rate": 3.094655346608939e-06, "loss": 0.4072, "step": 12167 }, { "epoch": 2.25, "learning_rate": 3.0932107282929004e-06, "loss": 0.4191, "step": 12168 }, { "epoch": 2.25, "learning_rate": 3.0917663855449663e-06, "loss": 0.4114, "step": 12169 }, { "epoch": 2.25, "learning_rate": 3.0903223184227602e-06, "loss": 0.3967, "step": 12170 }, { "epoch": 2.25, "learning_rate": 3.088878526983903e-06, "loss": 0.4367, "step": 12171 }, { "epoch": 2.25, "learning_rate": 3.0874350112859942e-06, "loss": 0.4002, "step": 12172 }, { "epoch": 2.25, "learning_rate": 3.0859917713866338e-06, "loss": 0.4324, "step": 12173 }, { "epoch": 2.25, "learning_rate": 3.0845488073434003e-06, "loss": 0.4322, "step": 12174 }, { "epoch": 2.25, "learning_rate": 3.0831061192138636e-06, "loss": 0.4299, "step": 12175 }, { "epoch": 2.25, "learning_rate": 3.0816637070555876e-06, "loss": 0.447, "step": 12176 }, { "epoch": 2.25, "learning_rate": 3.0802215709261194e-06, "loss": 0.4041, "step": 12177 }, { "epoch": 2.25, "learning_rate": 3.078779710883001e-06, "loss": 0.4307, "step": 12178 }, { "epoch": 2.25, "learning_rate": 3.0773381269837587e-06, "loss": 0.4115, "step": 12179 }, { "epoch": 2.25, "learning_rate": 3.075896819285904e-06, "loss": 0.3988, "step": 12180 }, { "epoch": 2.25, "learning_rate": 3.0744557878469506e-06, "loss": 0.4232, "step": 12181 }, { "epoch": 2.25, "learning_rate": 3.073015032724386e-06, "loss": 0.4065, "step": 12182 }, { "epoch": 2.25, "learning_rate": 3.071574553975698e-06, "loss": 0.429, "step": 12183 }, { "epoch": 2.25, "learning_rate": 3.0701343516583558e-06, "loss": 0.4122, "step": 12184 }, { "epoch": 2.25, "learning_rate": 3.068694425829826e-06, "loss": 0.4097, "step": 12185 }, { "epoch": 2.25, "learning_rate": 3.0672547765475557e-06, "loss": 0.4268, "step": 12186 }, { "epoch": 2.25, "learning_rate": 3.0658154038689804e-06, "loss": 0.4073, "step": 12187 }, { "epoch": 2.25, "learning_rate": 3.0643763078515353e-06, "loss": 0.4095, "step": 12188 }, { "epoch": 2.26, "learning_rate": 3.062937488552632e-06, "loss": 0.4353, "step": 12189 }, { "epoch": 2.26, "learning_rate": 3.061498946029683e-06, "loss": 0.4057, "step": 12190 }, { "epoch": 2.26, "learning_rate": 3.060060680340079e-06, "loss": 0.4019, "step": 12191 }, { "epoch": 2.26, "learning_rate": 3.0586226915412008e-06, "loss": 0.4188, "step": 12192 }, { "epoch": 2.26, "learning_rate": 3.0571849796904296e-06, "loss": 0.4016, "step": 12193 }, { "epoch": 2.26, "learning_rate": 3.0557475448451203e-06, "loss": 0.4219, "step": 12194 }, { "epoch": 2.26, "learning_rate": 3.0543103870626303e-06, "loss": 0.4084, "step": 12195 }, { "epoch": 2.26, "learning_rate": 3.0528735064002966e-06, "loss": 0.4303, "step": 12196 }, { "epoch": 2.26, "learning_rate": 3.0514369029154435e-06, "loss": 0.4207, "step": 12197 }, { "epoch": 2.26, "learning_rate": 3.0500005766653973e-06, "loss": 0.436, "step": 12198 }, { "epoch": 2.26, "learning_rate": 3.0485645277074573e-06, "loss": 0.4402, "step": 12199 }, { "epoch": 2.26, "learning_rate": 3.0471287560989247e-06, "loss": 0.4129, "step": 12200 }, { "epoch": 2.26, "learning_rate": 3.0456932618970824e-06, "loss": 0.4253, "step": 12201 }, { "epoch": 2.26, "learning_rate": 3.0442580451592e-06, "loss": 0.4081, "step": 12202 }, { "epoch": 2.26, "learning_rate": 3.0428231059425463e-06, "loss": 0.4259, "step": 12203 }, { "epoch": 2.26, "learning_rate": 3.041388444304367e-06, "loss": 0.392, "step": 12204 }, { "epoch": 2.26, "learning_rate": 3.0399540603019083e-06, "loss": 0.4313, "step": 12205 }, { "epoch": 2.26, "learning_rate": 3.0385199539923936e-06, "loss": 0.4256, "step": 12206 }, { "epoch": 2.26, "learning_rate": 3.0370861254330474e-06, "loss": 0.4133, "step": 12207 }, { "epoch": 2.26, "learning_rate": 3.0356525746810693e-06, "loss": 0.4298, "step": 12208 }, { "epoch": 2.26, "learning_rate": 3.034219301793663e-06, "loss": 0.4167, "step": 12209 }, { "epoch": 2.26, "learning_rate": 3.032786306828006e-06, "loss": 0.4259, "step": 12210 }, { "epoch": 2.26, "learning_rate": 3.0313535898412795e-06, "loss": 0.4273, "step": 12211 }, { "epoch": 2.26, "learning_rate": 3.029921150890639e-06, "loss": 0.427, "step": 12212 }, { "epoch": 2.26, "learning_rate": 3.028488990033244e-06, "loss": 0.41, "step": 12213 }, { "epoch": 2.26, "learning_rate": 3.027057107326227e-06, "loss": 0.3993, "step": 12214 }, { "epoch": 2.26, "learning_rate": 3.0256255028267243e-06, "loss": 0.4051, "step": 12215 }, { "epoch": 2.26, "learning_rate": 3.024194176591848e-06, "loss": 0.4045, "step": 12216 }, { "epoch": 2.26, "learning_rate": 3.022763128678713e-06, "loss": 0.4092, "step": 12217 }, { "epoch": 2.26, "learning_rate": 3.0213323591444097e-06, "loss": 0.4009, "step": 12218 }, { "epoch": 2.26, "learning_rate": 3.0199018680460236e-06, "loss": 0.4191, "step": 12219 }, { "epoch": 2.26, "learning_rate": 3.0184716554406314e-06, "loss": 0.418, "step": 12220 }, { "epoch": 2.26, "learning_rate": 3.017041721385291e-06, "loss": 0.4248, "step": 12221 }, { "epoch": 2.26, "learning_rate": 3.0156120659370603e-06, "loss": 0.4225, "step": 12222 }, { "epoch": 2.26, "learning_rate": 3.0141826891529768e-06, "loss": 0.4353, "step": 12223 }, { "epoch": 2.26, "learning_rate": 3.0127535910900672e-06, "loss": 0.4093, "step": 12224 }, { "epoch": 2.26, "learning_rate": 3.011324771805356e-06, "loss": 0.4094, "step": 12225 }, { "epoch": 2.26, "learning_rate": 3.0098962313558442e-06, "loss": 0.3923, "step": 12226 }, { "epoch": 2.26, "learning_rate": 3.008467969798534e-06, "loss": 0.4549, "step": 12227 }, { "epoch": 2.26, "learning_rate": 3.007039987190404e-06, "loss": 0.434, "step": 12228 }, { "epoch": 2.26, "learning_rate": 3.005612283588435e-06, "loss": 0.4135, "step": 12229 }, { "epoch": 2.26, "learning_rate": 3.004184859049586e-06, "loss": 0.4186, "step": 12230 }, { "epoch": 2.26, "learning_rate": 3.0027577136308063e-06, "loss": 0.3975, "step": 12231 }, { "epoch": 2.26, "learning_rate": 3.0013308473890403e-06, "loss": 0.4208, "step": 12232 }, { "epoch": 2.26, "learning_rate": 2.9999042603812136e-06, "loss": 0.4151, "step": 12233 }, { "epoch": 2.26, "learning_rate": 2.9984779526642494e-06, "loss": 0.4432, "step": 12234 }, { "epoch": 2.26, "learning_rate": 2.9970519242950522e-06, "loss": 0.4306, "step": 12235 }, { "epoch": 2.26, "learning_rate": 2.995626175330514e-06, "loss": 0.4055, "step": 12236 }, { "epoch": 2.26, "learning_rate": 2.994200705827527e-06, "loss": 0.4123, "step": 12237 }, { "epoch": 2.26, "learning_rate": 2.992775515842957e-06, "loss": 0.4353, "step": 12238 }, { "epoch": 2.26, "learning_rate": 2.991350605433674e-06, "loss": 0.414, "step": 12239 }, { "epoch": 2.26, "learning_rate": 2.989925974656526e-06, "loss": 0.3911, "step": 12240 }, { "epoch": 2.26, "learning_rate": 2.9885016235683497e-06, "loss": 0.4135, "step": 12241 }, { "epoch": 2.26, "learning_rate": 2.98707755222598e-06, "loss": 0.4092, "step": 12242 }, { "epoch": 2.27, "learning_rate": 2.985653760686228e-06, "loss": 0.4224, "step": 12243 }, { "epoch": 2.27, "learning_rate": 2.984230249005908e-06, "loss": 0.4211, "step": 12244 }, { "epoch": 2.27, "learning_rate": 2.9828070172418122e-06, "loss": 0.4297, "step": 12245 }, { "epoch": 2.27, "learning_rate": 2.9813840654507207e-06, "loss": 0.4119, "step": 12246 }, { "epoch": 2.27, "learning_rate": 2.9799613936894135e-06, "loss": 0.4127, "step": 12247 }, { "epoch": 2.27, "learning_rate": 2.9785390020146467e-06, "loss": 0.4108, "step": 12248 }, { "epoch": 2.27, "learning_rate": 2.977116890483176e-06, "loss": 0.4142, "step": 12249 }, { "epoch": 2.27, "learning_rate": 2.9756950591517363e-06, "loss": 0.4199, "step": 12250 }, { "epoch": 2.27, "learning_rate": 2.9742735080770623e-06, "loss": 0.4199, "step": 12251 }, { "epoch": 2.27, "learning_rate": 2.9728522373158673e-06, "loss": 0.42, "step": 12252 }, { "epoch": 2.27, "learning_rate": 2.971431246924854e-06, "loss": 0.4313, "step": 12253 }, { "epoch": 2.27, "learning_rate": 2.9700105369607247e-06, "loss": 0.4201, "step": 12254 }, { "epoch": 2.27, "learning_rate": 2.9685901074801547e-06, "loss": 0.4194, "step": 12255 }, { "epoch": 2.27, "learning_rate": 2.967169958539826e-06, "loss": 0.3983, "step": 12256 }, { "epoch": 2.27, "learning_rate": 2.965750090196391e-06, "loss": 0.4389, "step": 12257 }, { "epoch": 2.27, "learning_rate": 2.964330502506507e-06, "loss": 0.4212, "step": 12258 }, { "epoch": 2.27, "learning_rate": 2.9629111955268063e-06, "loss": 0.4011, "step": 12259 }, { "epoch": 2.27, "learning_rate": 2.961492169313924e-06, "loss": 0.4222, "step": 12260 }, { "epoch": 2.27, "learning_rate": 2.96007342392447e-06, "loss": 0.3987, "step": 12261 }, { "epoch": 2.27, "learning_rate": 2.9586549594150537e-06, "loss": 0.4337, "step": 12262 }, { "epoch": 2.27, "learning_rate": 2.957236775842266e-06, "loss": 0.4248, "step": 12263 }, { "epoch": 2.27, "learning_rate": 2.955818873262695e-06, "loss": 0.4194, "step": 12264 }, { "epoch": 2.27, "learning_rate": 2.9544012517329046e-06, "loss": 0.4222, "step": 12265 }, { "epoch": 2.27, "learning_rate": 2.952983911309464e-06, "loss": 0.4051, "step": 12266 }, { "epoch": 2.27, "learning_rate": 2.9515668520489173e-06, "loss": 0.4138, "step": 12267 }, { "epoch": 2.27, "learning_rate": 2.9501500740078004e-06, "loss": 0.4214, "step": 12268 }, { "epoch": 2.27, "learning_rate": 2.948733577242646e-06, "loss": 0.4236, "step": 12269 }, { "epoch": 2.27, "learning_rate": 2.947317361809965e-06, "loss": 0.4195, "step": 12270 }, { "epoch": 2.27, "learning_rate": 2.9459014277662656e-06, "loss": 0.4019, "step": 12271 }, { "epoch": 2.27, "learning_rate": 2.9444857751680358e-06, "loss": 0.4172, "step": 12272 }, { "epoch": 2.27, "learning_rate": 2.943070404071764e-06, "loss": 0.4259, "step": 12273 }, { "epoch": 2.27, "learning_rate": 2.9416553145339167e-06, "loss": 0.3985, "step": 12274 }, { "epoch": 2.27, "learning_rate": 2.9402405066109517e-06, "loss": 0.4224, "step": 12275 }, { "epoch": 2.27, "learning_rate": 2.938825980359323e-06, "loss": 0.4072, "step": 12276 }, { "epoch": 2.27, "learning_rate": 2.9374117358354616e-06, "loss": 0.4158, "step": 12277 }, { "epoch": 2.27, "learning_rate": 2.935997773095798e-06, "loss": 0.4201, "step": 12278 }, { "epoch": 2.27, "learning_rate": 2.934584092196745e-06, "loss": 0.4253, "step": 12279 }, { "epoch": 2.27, "learning_rate": 2.9331706931947024e-06, "loss": 0.4103, "step": 12280 }, { "epoch": 2.27, "learning_rate": 2.931757576146068e-06, "loss": 0.401, "step": 12281 }, { "epoch": 2.27, "learning_rate": 2.930344741107217e-06, "loss": 0.4228, "step": 12282 }, { "epoch": 2.27, "learning_rate": 2.9289321881345257e-06, "loss": 0.4224, "step": 12283 }, { "epoch": 2.27, "learning_rate": 2.9275199172843473e-06, "loss": 0.4153, "step": 12284 }, { "epoch": 2.27, "learning_rate": 2.9261079286130267e-06, "loss": 0.4258, "step": 12285 }, { "epoch": 2.27, "learning_rate": 2.9246962221769073e-06, "loss": 0.4242, "step": 12286 }, { "epoch": 2.27, "learning_rate": 2.9232847980323043e-06, "loss": 0.4277, "step": 12287 }, { "epoch": 2.27, "learning_rate": 2.9218736562355388e-06, "loss": 0.4142, "step": 12288 }, { "epoch": 2.27, "learning_rate": 2.92046279684291e-06, "loss": 0.4404, "step": 12289 }, { "epoch": 2.27, "learning_rate": 2.9190522199107054e-06, "loss": 0.4308, "step": 12290 }, { "epoch": 2.27, "learning_rate": 2.9176419254952104e-06, "loss": 0.4225, "step": 12291 }, { "epoch": 2.27, "learning_rate": 2.916231913652686e-06, "loss": 0.4169, "step": 12292 }, { "epoch": 2.27, "learning_rate": 2.9148221844393975e-06, "loss": 0.4136, "step": 12293 }, { "epoch": 2.27, "learning_rate": 2.913412737911585e-06, "loss": 0.4276, "step": 12294 }, { "epoch": 2.27, "learning_rate": 2.9120035741254806e-06, "loss": 0.4401, "step": 12295 }, { "epoch": 2.27, "learning_rate": 2.910594693137314e-06, "loss": 0.4276, "step": 12296 }, { "epoch": 2.28, "learning_rate": 2.9091860950032904e-06, "loss": 0.4206, "step": 12297 }, { "epoch": 2.28, "learning_rate": 2.907777779779616e-06, "loss": 0.4216, "step": 12298 }, { "epoch": 2.28, "learning_rate": 2.906369747522474e-06, "loss": 0.4016, "step": 12299 }, { "epoch": 2.28, "learning_rate": 2.9049619982880494e-06, "loss": 0.4173, "step": 12300 }, { "epoch": 2.28, "learning_rate": 2.903554532132504e-06, "loss": 0.41, "step": 12301 }, { "epoch": 2.28, "learning_rate": 2.9021473491119924e-06, "loss": 0.4137, "step": 12302 }, { "epoch": 2.28, "learning_rate": 2.9007404492826618e-06, "loss": 0.4124, "step": 12303 }, { "epoch": 2.28, "learning_rate": 2.8993338327006413e-06, "loss": 0.4093, "step": 12304 }, { "epoch": 2.28, "learning_rate": 2.8979274994220576e-06, "loss": 0.4061, "step": 12305 }, { "epoch": 2.28, "learning_rate": 2.896521449503014e-06, "loss": 0.3895, "step": 12306 }, { "epoch": 2.28, "learning_rate": 2.8951156829996153e-06, "loss": 0.4001, "step": 12307 }, { "epoch": 2.28, "learning_rate": 2.893710199967944e-06, "loss": 0.4034, "step": 12308 }, { "epoch": 2.28, "learning_rate": 2.892305000464082e-06, "loss": 0.4128, "step": 12309 }, { "epoch": 2.28, "learning_rate": 2.890900084544087e-06, "loss": 0.411, "step": 12310 }, { "epoch": 2.28, "learning_rate": 2.8894954522640206e-06, "loss": 0.4065, "step": 12311 }, { "epoch": 2.28, "learning_rate": 2.8880911036799175e-06, "loss": 0.4244, "step": 12312 }, { "epoch": 2.28, "learning_rate": 2.886687038847815e-06, "loss": 0.4024, "step": 12313 }, { "epoch": 2.28, "learning_rate": 2.8852832578237267e-06, "loss": 0.4021, "step": 12314 }, { "epoch": 2.28, "learning_rate": 2.883879760663667e-06, "loss": 0.4246, "step": 12315 }, { "epoch": 2.28, "learning_rate": 2.8824765474236305e-06, "loss": 0.4253, "step": 12316 }, { "epoch": 2.28, "learning_rate": 2.8810736181595976e-06, "loss": 0.4164, "step": 12317 }, { "epoch": 2.28, "learning_rate": 2.8796709729275505e-06, "loss": 0.3949, "step": 12318 }, { "epoch": 2.28, "learning_rate": 2.8782686117834455e-06, "loss": 0.4015, "step": 12319 }, { "epoch": 2.28, "learning_rate": 2.8768665347832402e-06, "loss": 0.4104, "step": 12320 }, { "epoch": 2.28, "learning_rate": 2.8754647419828696e-06, "loss": 0.4257, "step": 12321 }, { "epoch": 2.28, "learning_rate": 2.874063233438268e-06, "loss": 0.4264, "step": 12322 }, { "epoch": 2.28, "learning_rate": 2.87266200920535e-06, "loss": 0.4133, "step": 12323 }, { "epoch": 2.28, "learning_rate": 2.871261069340019e-06, "loss": 0.4176, "step": 12324 }, { "epoch": 2.28, "learning_rate": 2.8698604138981756e-06, "loss": 0.4236, "step": 12325 }, { "epoch": 2.28, "learning_rate": 2.868460042935697e-06, "loss": 0.4438, "step": 12326 }, { "epoch": 2.28, "learning_rate": 2.8670599565084633e-06, "loss": 0.4137, "step": 12327 }, { "epoch": 2.28, "learning_rate": 2.8656601546723295e-06, "loss": 0.4217, "step": 12328 }, { "epoch": 2.28, "learning_rate": 2.864260637483145e-06, "loss": 0.4303, "step": 12329 }, { "epoch": 2.28, "learning_rate": 2.862861404996752e-06, "loss": 0.4186, "step": 12330 }, { "epoch": 2.28, "learning_rate": 2.861462457268972e-06, "loss": 0.4051, "step": 12331 }, { "epoch": 2.28, "learning_rate": 2.8600637943556265e-06, "loss": 0.4099, "step": 12332 }, { "epoch": 2.28, "learning_rate": 2.858665416312516e-06, "loss": 0.4088, "step": 12333 }, { "epoch": 2.28, "learning_rate": 2.8572673231954307e-06, "loss": 0.4097, "step": 12334 }, { "epoch": 2.28, "learning_rate": 2.8558695150601577e-06, "loss": 0.413, "step": 12335 }, { "epoch": 2.28, "learning_rate": 2.8544719919624608e-06, "loss": 0.4235, "step": 12336 }, { "epoch": 2.28, "learning_rate": 2.853074753958106e-06, "loss": 0.4261, "step": 12337 }, { "epoch": 2.28, "learning_rate": 2.8516778011028357e-06, "loss": 0.4403, "step": 12338 }, { "epoch": 2.28, "learning_rate": 2.8502811334523826e-06, "loss": 0.4218, "step": 12339 }, { "epoch": 2.28, "learning_rate": 2.8488847510624782e-06, "loss": 0.4079, "step": 12340 }, { "epoch": 2.28, "learning_rate": 2.84748865398883e-06, "loss": 0.4218, "step": 12341 }, { "epoch": 2.28, "learning_rate": 2.846092842287145e-06, "loss": 0.4272, "step": 12342 }, { "epoch": 2.28, "learning_rate": 2.844697316013106e-06, "loss": 0.4363, "step": 12343 }, { "epoch": 2.28, "learning_rate": 2.8433020752224007e-06, "loss": 0.4196, "step": 12344 }, { "epoch": 2.28, "learning_rate": 2.8419071199706925e-06, "loss": 0.4112, "step": 12345 }, { "epoch": 2.28, "learning_rate": 2.840512450313634e-06, "loss": 0.4103, "step": 12346 }, { "epoch": 2.28, "learning_rate": 2.8391180663068764e-06, "loss": 0.416, "step": 12347 }, { "epoch": 2.28, "learning_rate": 2.8377239680060466e-06, "loss": 0.4104, "step": 12348 }, { "epoch": 2.28, "learning_rate": 2.8363301554667732e-06, "loss": 0.4103, "step": 12349 }, { "epoch": 2.28, "learning_rate": 2.8349366287446636e-06, "loss": 0.4085, "step": 12350 }, { "epoch": 2.29, "learning_rate": 2.833543387895312e-06, "loss": 0.4114, "step": 12351 }, { "epoch": 2.29, "learning_rate": 2.8321504329743153e-06, "loss": 0.4319, "step": 12352 }, { "epoch": 2.29, "learning_rate": 2.830757764037243e-06, "loss": 0.4008, "step": 12353 }, { "epoch": 2.29, "learning_rate": 2.8293653811396648e-06, "loss": 0.4209, "step": 12354 }, { "epoch": 2.29, "learning_rate": 2.8279732843371288e-06, "loss": 0.4319, "step": 12355 }, { "epoch": 2.29, "learning_rate": 2.826581473685184e-06, "loss": 0.4125, "step": 12356 }, { "epoch": 2.29, "learning_rate": 2.8251899492393532e-06, "loss": 0.419, "step": 12357 }, { "epoch": 2.29, "learning_rate": 2.8237987110551622e-06, "loss": 0.4027, "step": 12358 }, { "epoch": 2.29, "learning_rate": 2.822407759188114e-06, "loss": 0.4213, "step": 12359 }, { "epoch": 2.29, "learning_rate": 2.8210170936937096e-06, "loss": 0.4087, "step": 12360 }, { "epoch": 2.29, "learning_rate": 2.8196267146274293e-06, "loss": 0.3937, "step": 12361 }, { "epoch": 2.29, "learning_rate": 2.818236622044751e-06, "loss": 0.424, "step": 12362 }, { "epoch": 2.29, "learning_rate": 2.816846816001133e-06, "loss": 0.3956, "step": 12363 }, { "epoch": 2.29, "learning_rate": 2.81545729655203e-06, "loss": 0.4182, "step": 12364 }, { "epoch": 2.29, "learning_rate": 2.8140680637528774e-06, "loss": 0.4081, "step": 12365 }, { "epoch": 2.29, "learning_rate": 2.812679117659106e-06, "loss": 0.3998, "step": 12366 }, { "epoch": 2.29, "learning_rate": 2.8112904583261314e-06, "loss": 0.4006, "step": 12367 }, { "epoch": 2.29, "learning_rate": 2.809902085809355e-06, "loss": 0.4248, "step": 12368 }, { "epoch": 2.29, "learning_rate": 2.8085140001641764e-06, "loss": 0.4304, "step": 12369 }, { "epoch": 2.29, "learning_rate": 2.807126201445971e-06, "loss": 0.4294, "step": 12370 }, { "epoch": 2.29, "learning_rate": 2.805738689710117e-06, "loss": 0.4353, "step": 12371 }, { "epoch": 2.29, "learning_rate": 2.8043514650119684e-06, "loss": 0.4145, "step": 12372 }, { "epoch": 2.29, "learning_rate": 2.8029645274068717e-06, "loss": 0.4084, "step": 12373 }, { "epoch": 2.29, "learning_rate": 2.801577876950168e-06, "loss": 0.4241, "step": 12374 }, { "epoch": 2.29, "learning_rate": 2.800191513697176e-06, "loss": 0.406, "step": 12375 }, { "epoch": 2.29, "learning_rate": 2.798805437703216e-06, "loss": 0.4232, "step": 12376 }, { "epoch": 2.29, "learning_rate": 2.797419649023586e-06, "loss": 0.4162, "step": 12377 }, { "epoch": 2.29, "learning_rate": 2.7960341477135743e-06, "loss": 0.4087, "step": 12378 }, { "epoch": 2.29, "learning_rate": 2.7946489338284654e-06, "loss": 0.4253, "step": 12379 }, { "epoch": 2.29, "learning_rate": 2.7932640074235207e-06, "loss": 0.4207, "step": 12380 }, { "epoch": 2.29, "learning_rate": 2.7918793685540023e-06, "loss": 0.4013, "step": 12381 }, { "epoch": 2.29, "learning_rate": 2.790495017275151e-06, "loss": 0.4302, "step": 12382 }, { "epoch": 2.29, "learning_rate": 2.789110953642198e-06, "loss": 0.4035, "step": 12383 }, { "epoch": 2.29, "learning_rate": 2.78772717771037e-06, "loss": 0.4184, "step": 12384 }, { "epoch": 2.29, "learning_rate": 2.7863436895348715e-06, "loss": 0.4098, "step": 12385 }, { "epoch": 2.29, "learning_rate": 2.784960489170907e-06, "loss": 0.4002, "step": 12386 }, { "epoch": 2.29, "learning_rate": 2.7835775766736583e-06, "loss": 0.4155, "step": 12387 }, { "epoch": 2.29, "learning_rate": 2.782194952098306e-06, "loss": 0.4138, "step": 12388 }, { "epoch": 2.29, "learning_rate": 2.7808126155000114e-06, "loss": 0.4132, "step": 12389 }, { "epoch": 2.29, "learning_rate": 2.779430566933925e-06, "loss": 0.4058, "step": 12390 }, { "epoch": 2.29, "learning_rate": 2.7780488064551927e-06, "loss": 0.4254, "step": 12391 }, { "epoch": 2.29, "learning_rate": 2.77666733411894e-06, "loss": 0.4229, "step": 12392 }, { "epoch": 2.29, "learning_rate": 2.7752861499802886e-06, "loss": 0.4162, "step": 12393 }, { "epoch": 2.29, "learning_rate": 2.7739052540943447e-06, "loss": 0.3979, "step": 12394 }, { "epoch": 2.29, "learning_rate": 2.772524646516199e-06, "loss": 0.4291, "step": 12395 }, { "epoch": 2.29, "learning_rate": 2.771144327300942e-06, "loss": 0.3889, "step": 12396 }, { "epoch": 2.29, "learning_rate": 2.769764296503639e-06, "loss": 0.4132, "step": 12397 }, { "epoch": 2.29, "learning_rate": 2.7683845541793577e-06, "loss": 0.4313, "step": 12398 }, { "epoch": 2.29, "learning_rate": 2.7670051003831433e-06, "loss": 0.4269, "step": 12399 }, { "epoch": 2.29, "learning_rate": 2.765625935170031e-06, "loss": 0.4135, "step": 12400 }, { "epoch": 2.29, "learning_rate": 2.764247058595052e-06, "loss": 0.3916, "step": 12401 }, { "epoch": 2.29, "learning_rate": 2.762868470713217e-06, "loss": 0.4142, "step": 12402 }, { "epoch": 2.29, "learning_rate": 2.761490171579533e-06, "loss": 0.4044, "step": 12403 }, { "epoch": 2.29, "learning_rate": 2.7601121612489866e-06, "loss": 0.4176, "step": 12404 }, { "epoch": 2.3, "learning_rate": 2.7587344397765637e-06, "loss": 0.4226, "step": 12405 }, { "epoch": 2.3, "learning_rate": 2.757357007217227e-06, "loss": 0.4162, "step": 12406 }, { "epoch": 2.3, "learning_rate": 2.7559798636259394e-06, "loss": 0.4082, "step": 12407 }, { "epoch": 2.3, "learning_rate": 2.7546030090576402e-06, "loss": 0.4121, "step": 12408 }, { "epoch": 2.3, "learning_rate": 2.7532264435672695e-06, "loss": 0.4127, "step": 12409 }, { "epoch": 2.3, "learning_rate": 2.751850167209743e-06, "loss": 0.3918, "step": 12410 }, { "epoch": 2.3, "learning_rate": 2.7504741800399792e-06, "loss": 0.4201, "step": 12411 }, { "epoch": 2.3, "learning_rate": 2.7490984821128695e-06, "loss": 0.4139, "step": 12412 }, { "epoch": 2.3, "learning_rate": 2.7477230734833095e-06, "loss": 0.3921, "step": 12413 }, { "epoch": 2.3, "learning_rate": 2.7463479542061678e-06, "loss": 0.4405, "step": 12414 }, { "epoch": 2.3, "learning_rate": 2.7449731243363164e-06, "loss": 0.4057, "step": 12415 }, { "epoch": 2.3, "learning_rate": 2.743598583928605e-06, "loss": 0.4093, "step": 12416 }, { "epoch": 2.3, "learning_rate": 2.742224333037873e-06, "loss": 0.4108, "step": 12417 }, { "epoch": 2.3, "learning_rate": 2.740850371718955e-06, "loss": 0.4079, "step": 12418 }, { "epoch": 2.3, "learning_rate": 2.739476700026664e-06, "loss": 0.411, "step": 12419 }, { "epoch": 2.3, "learning_rate": 2.7381033180158133e-06, "loss": 0.4322, "step": 12420 }, { "epoch": 2.3, "learning_rate": 2.7367302257411956e-06, "loss": 0.4161, "step": 12421 }, { "epoch": 2.3, "learning_rate": 2.7353574232575907e-06, "loss": 0.4222, "step": 12422 }, { "epoch": 2.3, "learning_rate": 2.733984910619777e-06, "loss": 0.4209, "step": 12423 }, { "epoch": 2.3, "learning_rate": 2.732612687882511e-06, "loss": 0.4144, "step": 12424 }, { "epoch": 2.3, "learning_rate": 2.731240755100546e-06, "loss": 0.419, "step": 12425 }, { "epoch": 2.3, "learning_rate": 2.729869112328617e-06, "loss": 0.4191, "step": 12426 }, { "epoch": 2.3, "learning_rate": 2.7284977596214467e-06, "loss": 0.4172, "step": 12427 }, { "epoch": 2.3, "learning_rate": 2.7271266970337575e-06, "loss": 0.3974, "step": 12428 }, { "epoch": 2.3, "learning_rate": 2.7257559246202424e-06, "loss": 0.4119, "step": 12429 }, { "epoch": 2.3, "learning_rate": 2.7243854424356033e-06, "loss": 0.4168, "step": 12430 }, { "epoch": 2.3, "learning_rate": 2.7230152505345096e-06, "loss": 0.4331, "step": 12431 }, { "epoch": 2.3, "learning_rate": 2.7216453489716388e-06, "loss": 0.4221, "step": 12432 }, { "epoch": 2.3, "learning_rate": 2.720275737801643e-06, "loss": 0.4212, "step": 12433 }, { "epoch": 2.3, "learning_rate": 2.7189064170791635e-06, "loss": 0.4099, "step": 12434 }, { "epoch": 2.3, "learning_rate": 2.7175373868588416e-06, "loss": 0.394, "step": 12435 }, { "epoch": 2.3, "learning_rate": 2.716168647195291e-06, "loss": 0.422, "step": 12436 }, { "epoch": 2.3, "learning_rate": 2.714800198143128e-06, "loss": 0.4157, "step": 12437 }, { "epoch": 2.3, "learning_rate": 2.71343203975695e-06, "loss": 0.4286, "step": 12438 }, { "epoch": 2.3, "learning_rate": 2.7120641720913397e-06, "loss": 0.4265, "step": 12439 }, { "epoch": 2.3, "learning_rate": 2.710696595200878e-06, "loss": 0.4323, "step": 12440 }, { "epoch": 2.3, "learning_rate": 2.709329309140124e-06, "loss": 0.4163, "step": 12441 }, { "epoch": 2.3, "learning_rate": 2.7079623139636356e-06, "loss": 0.409, "step": 12442 }, { "epoch": 2.3, "learning_rate": 2.7065956097259493e-06, "loss": 0.4131, "step": 12443 }, { "epoch": 2.3, "learning_rate": 2.7052291964815924e-06, "loss": 0.4394, "step": 12444 }, { "epoch": 2.3, "learning_rate": 2.703863074285087e-06, "loss": 0.4213, "step": 12445 }, { "epoch": 2.3, "learning_rate": 2.7024972431909337e-06, "loss": 0.3961, "step": 12446 }, { "epoch": 2.3, "learning_rate": 2.701131703253633e-06, "loss": 0.4015, "step": 12447 }, { "epoch": 2.3, "learning_rate": 2.6997664545276635e-06, "loss": 0.3908, "step": 12448 }, { "epoch": 2.3, "learning_rate": 2.6984014970674934e-06, "loss": 0.4195, "step": 12449 }, { "epoch": 2.3, "learning_rate": 2.6970368309275872e-06, "loss": 0.4217, "step": 12450 }, { "epoch": 2.3, "learning_rate": 2.695672456162388e-06, "loss": 0.4193, "step": 12451 }, { "epoch": 2.3, "learning_rate": 2.6943083728263375e-06, "loss": 0.4091, "step": 12452 }, { "epoch": 2.3, "learning_rate": 2.692944580973854e-06, "loss": 0.4078, "step": 12453 }, { "epoch": 2.3, "learning_rate": 2.6915810806593556e-06, "loss": 0.4201, "step": 12454 }, { "epoch": 2.3, "learning_rate": 2.690217871937241e-06, "loss": 0.4241, "step": 12455 }, { "epoch": 2.3, "learning_rate": 2.6888549548618968e-06, "loss": 0.3994, "step": 12456 }, { "epoch": 2.3, "learning_rate": 2.6874923294877064e-06, "loss": 0.4102, "step": 12457 }, { "epoch": 2.3, "learning_rate": 2.68612999586903e-06, "loss": 0.4267, "step": 12458 }, { "epoch": 2.31, "learning_rate": 2.684767954060229e-06, "loss": 0.4191, "step": 12459 }, { "epoch": 2.31, "learning_rate": 2.6834062041156395e-06, "loss": 0.4013, "step": 12460 }, { "epoch": 2.31, "learning_rate": 2.6820447460895994e-06, "loss": 0.4178, "step": 12461 }, { "epoch": 2.31, "learning_rate": 2.6806835800364217e-06, "loss": 0.4372, "step": 12462 }, { "epoch": 2.31, "learning_rate": 2.6793227060104222e-06, "loss": 0.4249, "step": 12463 }, { "epoch": 2.31, "learning_rate": 2.677962124065888e-06, "loss": 0.4271, "step": 12464 }, { "epoch": 2.31, "learning_rate": 2.676601834257113e-06, "loss": 0.4072, "step": 12465 }, { "epoch": 2.31, "learning_rate": 2.6752418366383625e-06, "loss": 0.4293, "step": 12466 }, { "epoch": 2.31, "learning_rate": 2.673882131263904e-06, "loss": 0.4243, "step": 12467 }, { "epoch": 2.31, "learning_rate": 2.672522718187981e-06, "loss": 0.414, "step": 12468 }, { "epoch": 2.31, "learning_rate": 2.6711635974648385e-06, "loss": 0.4203, "step": 12469 }, { "epoch": 2.31, "learning_rate": 2.6698047691487005e-06, "loss": 0.4203, "step": 12470 }, { "epoch": 2.31, "learning_rate": 2.6684462332937765e-06, "loss": 0.4141, "step": 12471 }, { "epoch": 2.31, "learning_rate": 2.6670879899542777e-06, "loss": 0.4095, "step": 12472 }, { "epoch": 2.31, "learning_rate": 2.6657300391843876e-06, "loss": 0.4305, "step": 12473 }, { "epoch": 2.31, "learning_rate": 2.664372381038294e-06, "loss": 0.4135, "step": 12474 }, { "epoch": 2.31, "learning_rate": 2.6630150155701575e-06, "loss": 0.3995, "step": 12475 }, { "epoch": 2.31, "learning_rate": 2.6616579428341407e-06, "loss": 0.4187, "step": 12476 }, { "epoch": 2.31, "learning_rate": 2.6603011628843845e-06, "loss": 0.4053, "step": 12477 }, { "epoch": 2.31, "learning_rate": 2.6589446757750204e-06, "loss": 0.4345, "step": 12478 }, { "epoch": 2.31, "learning_rate": 2.657588481560176e-06, "loss": 0.4307, "step": 12479 }, { "epoch": 2.31, "learning_rate": 2.6562325802939527e-06, "loss": 0.4053, "step": 12480 }, { "epoch": 2.31, "learning_rate": 2.654876972030457e-06, "loss": 0.4282, "step": 12481 }, { "epoch": 2.31, "learning_rate": 2.6535216568237708e-06, "loss": 0.4168, "step": 12482 }, { "epoch": 2.31, "learning_rate": 2.652166634727965e-06, "loss": 0.435, "step": 12483 }, { "epoch": 2.31, "learning_rate": 2.6508119057971105e-06, "loss": 0.4105, "step": 12484 }, { "epoch": 2.31, "learning_rate": 2.6494574700852504e-06, "loss": 0.4189, "step": 12485 }, { "epoch": 2.31, "learning_rate": 2.6481033276464306e-06, "loss": 0.4114, "step": 12486 }, { "epoch": 2.31, "learning_rate": 2.6467494785346782e-06, "loss": 0.4085, "step": 12487 }, { "epoch": 2.31, "learning_rate": 2.6453959228040028e-06, "loss": 0.4288, "step": 12488 }, { "epoch": 2.31, "learning_rate": 2.644042660508417e-06, "loss": 0.4237, "step": 12489 }, { "epoch": 2.31, "learning_rate": 2.6426896917019062e-06, "loss": 0.4243, "step": 12490 }, { "epoch": 2.31, "learning_rate": 2.641337016438459e-06, "loss": 0.4029, "step": 12491 }, { "epoch": 2.31, "learning_rate": 2.6399846347720405e-06, "loss": 0.4335, "step": 12492 }, { "epoch": 2.31, "learning_rate": 2.6386325467566043e-06, "loss": 0.4248, "step": 12493 }, { "epoch": 2.31, "learning_rate": 2.637280752446104e-06, "loss": 0.4303, "step": 12494 }, { "epoch": 2.31, "learning_rate": 2.635929251894468e-06, "loss": 0.4213, "step": 12495 }, { "epoch": 2.31, "learning_rate": 2.6345780451556224e-06, "loss": 0.4162, "step": 12496 }, { "epoch": 2.31, "learning_rate": 2.6332271322834733e-06, "loss": 0.4124, "step": 12497 }, { "epoch": 2.31, "learning_rate": 2.631876513331926e-06, "loss": 0.4019, "step": 12498 }, { "epoch": 2.31, "learning_rate": 2.6305261883548625e-06, "loss": 0.4138, "step": 12499 }, { "epoch": 2.31, "learning_rate": 2.629176157406158e-06, "loss": 0.4032, "step": 12500 }, { "epoch": 2.31, "learning_rate": 2.627826420539681e-06, "loss": 0.439, "step": 12501 }, { "epoch": 2.31, "learning_rate": 2.626476977809278e-06, "loss": 0.4052, "step": 12502 }, { "epoch": 2.31, "learning_rate": 2.625127829268794e-06, "loss": 0.4082, "step": 12503 }, { "epoch": 2.31, "learning_rate": 2.6237789749720566e-06, "loss": 0.4168, "step": 12504 }, { "epoch": 2.31, "learning_rate": 2.6224304149728776e-06, "loss": 0.4316, "step": 12505 }, { "epoch": 2.31, "learning_rate": 2.621082149325068e-06, "loss": 0.3988, "step": 12506 }, { "epoch": 2.31, "learning_rate": 2.619734178082418e-06, "loss": 0.3851, "step": 12507 }, { "epoch": 2.31, "learning_rate": 2.618386501298712e-06, "loss": 0.4048, "step": 12508 }, { "epoch": 2.31, "learning_rate": 2.6170391190277143e-06, "loss": 0.4227, "step": 12509 }, { "epoch": 2.31, "learning_rate": 2.6156920313231903e-06, "loss": 0.4071, "step": 12510 }, { "epoch": 2.31, "learning_rate": 2.614345238238879e-06, "loss": 0.4208, "step": 12511 }, { "epoch": 2.31, "learning_rate": 2.6129987398285227e-06, "loss": 0.4198, "step": 12512 }, { "epoch": 2.32, "learning_rate": 2.6116525361458355e-06, "loss": 0.4182, "step": 12513 }, { "epoch": 2.32, "learning_rate": 2.6103066272445365e-06, "loss": 0.4013, "step": 12514 }, { "epoch": 2.32, "learning_rate": 2.6089610131783193e-06, "loss": 0.3906, "step": 12515 }, { "epoch": 2.32, "learning_rate": 2.6076156940008756e-06, "loss": 0.4073, "step": 12516 }, { "epoch": 2.32, "learning_rate": 2.606270669765876e-06, "loss": 0.4199, "step": 12517 }, { "epoch": 2.32, "learning_rate": 2.604925940526991e-06, "loss": 0.4138, "step": 12518 }, { "epoch": 2.32, "learning_rate": 2.6035815063378666e-06, "loss": 0.3999, "step": 12519 }, { "epoch": 2.32, "learning_rate": 2.6022373672521485e-06, "loss": 0.4082, "step": 12520 }, { "epoch": 2.32, "learning_rate": 2.6008935233234623e-06, "loss": 0.4222, "step": 12521 }, { "epoch": 2.32, "learning_rate": 2.5995499746054232e-06, "loss": 0.4197, "step": 12522 }, { "epoch": 2.32, "learning_rate": 2.5982067211516414e-06, "loss": 0.419, "step": 12523 }, { "epoch": 2.32, "learning_rate": 2.5968637630157044e-06, "loss": 0.4178, "step": 12524 }, { "epoch": 2.32, "learning_rate": 2.5955211002512006e-06, "loss": 0.4307, "step": 12525 }, { "epoch": 2.32, "learning_rate": 2.594178732911694e-06, "loss": 0.4016, "step": 12526 }, { "epoch": 2.32, "learning_rate": 2.5928366610507427e-06, "loss": 0.4169, "step": 12527 }, { "epoch": 2.32, "learning_rate": 2.591494884721898e-06, "loss": 0.4182, "step": 12528 }, { "epoch": 2.32, "learning_rate": 2.5901534039786867e-06, "loss": 0.4178, "step": 12529 }, { "epoch": 2.32, "learning_rate": 2.5888122188746388e-06, "loss": 0.433, "step": 12530 }, { "epoch": 2.32, "learning_rate": 2.5874713294632625e-06, "loss": 0.4222, "step": 12531 }, { "epoch": 2.32, "learning_rate": 2.5861307357980536e-06, "loss": 0.4289, "step": 12532 }, { "epoch": 2.32, "learning_rate": 2.584790437932504e-06, "loss": 0.4078, "step": 12533 }, { "epoch": 2.32, "learning_rate": 2.5834504359200843e-06, "loss": 0.4039, "step": 12534 }, { "epoch": 2.32, "learning_rate": 2.5821107298142643e-06, "loss": 0.4074, "step": 12535 }, { "epoch": 2.32, "learning_rate": 2.5807713196684913e-06, "loss": 0.4236, "step": 12536 }, { "epoch": 2.32, "learning_rate": 2.579432205536204e-06, "loss": 0.4157, "step": 12537 }, { "epoch": 2.32, "learning_rate": 2.5780933874708357e-06, "loss": 0.4034, "step": 12538 }, { "epoch": 2.32, "learning_rate": 2.576754865525798e-06, "loss": 0.4155, "step": 12539 }, { "epoch": 2.32, "learning_rate": 2.5754166397544987e-06, "loss": 0.4053, "step": 12540 }, { "epoch": 2.32, "learning_rate": 2.574078710210327e-06, "loss": 0.4003, "step": 12541 }, { "epoch": 2.32, "learning_rate": 2.5727410769466697e-06, "loss": 0.426, "step": 12542 }, { "epoch": 2.32, "learning_rate": 2.571403740016891e-06, "loss": 0.4145, "step": 12543 }, { "epoch": 2.32, "learning_rate": 2.570066699474347e-06, "loss": 0.3959, "step": 12544 }, { "epoch": 2.32, "learning_rate": 2.5687299553723887e-06, "loss": 0.4168, "step": 12545 }, { "epoch": 2.32, "learning_rate": 2.567393507764343e-06, "loss": 0.413, "step": 12546 }, { "epoch": 2.32, "learning_rate": 2.5660573567035394e-06, "loss": 0.428, "step": 12547 }, { "epoch": 2.32, "learning_rate": 2.5647215022432827e-06, "loss": 0.4296, "step": 12548 }, { "epoch": 2.32, "learning_rate": 2.5633859444368692e-06, "loss": 0.4106, "step": 12549 }, { "epoch": 2.32, "learning_rate": 2.5620506833375913e-06, "loss": 0.4315, "step": 12550 }, { "epoch": 2.32, "learning_rate": 2.5607157189987166e-06, "loss": 0.4165, "step": 12551 }, { "epoch": 2.32, "learning_rate": 2.559381051473514e-06, "loss": 0.4011, "step": 12552 }, { "epoch": 2.32, "learning_rate": 2.5580466808152326e-06, "loss": 0.4014, "step": 12553 }, { "epoch": 2.32, "learning_rate": 2.5567126070771064e-06, "loss": 0.4266, "step": 12554 }, { "epoch": 2.32, "learning_rate": 2.5553788303123694e-06, "loss": 0.4109, "step": 12555 }, { "epoch": 2.32, "learning_rate": 2.5540453505742303e-06, "loss": 0.4352, "step": 12556 }, { "epoch": 2.32, "learning_rate": 2.5527121679158996e-06, "loss": 0.4019, "step": 12557 }, { "epoch": 2.32, "learning_rate": 2.5513792823905625e-06, "loss": 0.4149, "step": 12558 }, { "epoch": 2.32, "learning_rate": 2.5500466940514034e-06, "loss": 0.4107, "step": 12559 }, { "epoch": 2.32, "learning_rate": 2.5487144029515854e-06, "loss": 0.4165, "step": 12560 }, { "epoch": 2.32, "learning_rate": 2.54738240914427e-06, "loss": 0.4137, "step": 12561 }, { "epoch": 2.32, "learning_rate": 2.546050712682595e-06, "loss": 0.4343, "step": 12562 }, { "epoch": 2.32, "learning_rate": 2.544719313619699e-06, "loss": 0.4236, "step": 12563 }, { "epoch": 2.32, "learning_rate": 2.5433882120086974e-06, "loss": 0.4289, "step": 12564 }, { "epoch": 2.32, "learning_rate": 2.5420574079027016e-06, "loss": 0.4139, "step": 12565 }, { "epoch": 2.32, "learning_rate": 2.5407269013548053e-06, "loss": 0.4278, "step": 12566 }, { "epoch": 2.33, "learning_rate": 2.539396692418099e-06, "loss": 0.4226, "step": 12567 }, { "epoch": 2.33, "learning_rate": 2.5380667811456473e-06, "loss": 0.4103, "step": 12568 }, { "epoch": 2.33, "learning_rate": 2.5367371675905196e-06, "loss": 0.4202, "step": 12569 }, { "epoch": 2.33, "learning_rate": 2.53540785180576e-06, "loss": 0.4304, "step": 12570 }, { "epoch": 2.33, "learning_rate": 2.5340788338444044e-06, "loss": 0.4229, "step": 12571 }, { "epoch": 2.33, "learning_rate": 2.5327501137594844e-06, "loss": 0.4057, "step": 12572 }, { "epoch": 2.33, "learning_rate": 2.5314216916040057e-06, "loss": 0.4019, "step": 12573 }, { "epoch": 2.33, "learning_rate": 2.530093567430977e-06, "loss": 0.4146, "step": 12574 }, { "epoch": 2.33, "learning_rate": 2.5287657412933842e-06, "loss": 0.4131, "step": 12575 }, { "epoch": 2.33, "learning_rate": 2.527438213244203e-06, "loss": 0.4254, "step": 12576 }, { "epoch": 2.33, "learning_rate": 2.5261109833364063e-06, "loss": 0.4197, "step": 12577 }, { "epoch": 2.33, "learning_rate": 2.524784051622939e-06, "loss": 0.4272, "step": 12578 }, { "epoch": 2.33, "learning_rate": 2.523457418156752e-06, "loss": 0.4174, "step": 12579 }, { "epoch": 2.33, "learning_rate": 2.522131082990771e-06, "loss": 0.3961, "step": 12580 }, { "epoch": 2.33, "learning_rate": 2.520805046177912e-06, "loss": 0.4181, "step": 12581 }, { "epoch": 2.33, "learning_rate": 2.5194793077710877e-06, "loss": 0.4159, "step": 12582 }, { "epoch": 2.33, "learning_rate": 2.5181538678231864e-06, "loss": 0.4247, "step": 12583 }, { "epoch": 2.33, "learning_rate": 2.516828726387096e-06, "loss": 0.4283, "step": 12584 }, { "epoch": 2.33, "learning_rate": 2.515503883515682e-06, "loss": 0.4093, "step": 12585 }, { "epoch": 2.33, "learning_rate": 2.5141793392618087e-06, "loss": 0.4147, "step": 12586 }, { "epoch": 2.33, "learning_rate": 2.5128550936783202e-06, "loss": 0.4048, "step": 12587 }, { "epoch": 2.33, "learning_rate": 2.511531146818048e-06, "loss": 0.412, "step": 12588 }, { "epoch": 2.33, "learning_rate": 2.510207498733822e-06, "loss": 0.4044, "step": 12589 }, { "epoch": 2.33, "learning_rate": 2.508884149478447e-06, "loss": 0.417, "step": 12590 }, { "epoch": 2.33, "learning_rate": 2.507561099104727e-06, "loss": 0.4013, "step": 12591 }, { "epoch": 2.33, "learning_rate": 2.5062383476654483e-06, "loss": 0.432, "step": 12592 }, { "epoch": 2.33, "learning_rate": 2.504915895213382e-06, "loss": 0.4152, "step": 12593 }, { "epoch": 2.33, "learning_rate": 2.503593741801298e-06, "loss": 0.4191, "step": 12594 }, { "epoch": 2.33, "learning_rate": 2.502271887481941e-06, "loss": 0.4294, "step": 12595 }, { "epoch": 2.33, "learning_rate": 2.5009503323080562e-06, "loss": 0.4239, "step": 12596 }, { "epoch": 2.33, "learning_rate": 2.4996290763323704e-06, "loss": 0.4429, "step": 12597 }, { "epoch": 2.33, "learning_rate": 2.4983081196075943e-06, "loss": 0.4037, "step": 12598 }, { "epoch": 2.33, "learning_rate": 2.4969874621864375e-06, "loss": 0.4258, "step": 12599 }, { "epoch": 2.33, "learning_rate": 2.4956671041215875e-06, "loss": 0.4067, "step": 12600 }, { "epoch": 2.33, "learning_rate": 2.494347045465729e-06, "loss": 0.4198, "step": 12601 }, { "epoch": 2.33, "learning_rate": 2.4930272862715268e-06, "loss": 0.3996, "step": 12602 }, { "epoch": 2.33, "learning_rate": 2.491707826591635e-06, "loss": 0.4088, "step": 12603 }, { "epoch": 2.33, "learning_rate": 2.490388666478701e-06, "loss": 0.4203, "step": 12604 }, { "epoch": 2.33, "learning_rate": 2.4890698059853535e-06, "loss": 0.4137, "step": 12605 }, { "epoch": 2.33, "learning_rate": 2.4877512451642183e-06, "loss": 0.4263, "step": 12606 }, { "epoch": 2.33, "learning_rate": 2.486432984067896e-06, "loss": 0.4084, "step": 12607 }, { "epoch": 2.33, "learning_rate": 2.4851150227489895e-06, "loss": 0.3996, "step": 12608 }, { "epoch": 2.33, "learning_rate": 2.4837973612600776e-06, "loss": 0.3977, "step": 12609 }, { "epoch": 2.33, "learning_rate": 2.4824799996537374e-06, "loss": 0.4178, "step": 12610 }, { "epoch": 2.33, "learning_rate": 2.4811629379825254e-06, "loss": 0.3869, "step": 12611 }, { "epoch": 2.33, "learning_rate": 2.4798461762989935e-06, "loss": 0.4033, "step": 12612 }, { "epoch": 2.33, "learning_rate": 2.4785297146556718e-06, "loss": 0.4181, "step": 12613 }, { "epoch": 2.33, "learning_rate": 2.477213553105093e-06, "loss": 0.4407, "step": 12614 }, { "epoch": 2.33, "learning_rate": 2.4758976916997624e-06, "loss": 0.4198, "step": 12615 }, { "epoch": 2.33, "learning_rate": 2.474582130492187e-06, "loss": 0.4023, "step": 12616 }, { "epoch": 2.33, "learning_rate": 2.4732668695348485e-06, "loss": 0.4228, "step": 12617 }, { "epoch": 2.33, "learning_rate": 2.471951908880228e-06, "loss": 0.4217, "step": 12618 }, { "epoch": 2.33, "learning_rate": 2.4706372485807894e-06, "loss": 0.419, "step": 12619 }, { "epoch": 2.33, "learning_rate": 2.469322888688982e-06, "loss": 0.4392, "step": 12620 }, { "epoch": 2.34, "learning_rate": 2.468008829257251e-06, "loss": 0.4094, "step": 12621 }, { "epoch": 2.34, "learning_rate": 2.46669507033802e-06, "loss": 0.3935, "step": 12622 }, { "epoch": 2.34, "learning_rate": 2.4653816119837102e-06, "loss": 0.399, "step": 12623 }, { "epoch": 2.34, "learning_rate": 2.4640684542467254e-06, "loss": 0.422, "step": 12624 }, { "epoch": 2.34, "learning_rate": 2.4627555971794525e-06, "loss": 0.3966, "step": 12625 }, { "epoch": 2.34, "learning_rate": 2.4614430408342806e-06, "loss": 0.4104, "step": 12626 }, { "epoch": 2.34, "learning_rate": 2.4601307852635714e-06, "loss": 0.4106, "step": 12627 }, { "epoch": 2.34, "learning_rate": 2.458818830519686e-06, "loss": 0.4198, "step": 12628 }, { "epoch": 2.34, "learning_rate": 2.4575071766549673e-06, "loss": 0.4042, "step": 12629 }, { "epoch": 2.34, "learning_rate": 2.4561958237217454e-06, "loss": 0.4197, "step": 12630 }, { "epoch": 2.34, "learning_rate": 2.4548847717723457e-06, "loss": 0.3975, "step": 12631 }, { "epoch": 2.34, "learning_rate": 2.453574020859071e-06, "loss": 0.4178, "step": 12632 }, { "epoch": 2.34, "learning_rate": 2.4522635710342247e-06, "loss": 0.3948, "step": 12633 }, { "epoch": 2.34, "learning_rate": 2.450953422350084e-06, "loss": 0.4356, "step": 12634 }, { "epoch": 2.34, "learning_rate": 2.449643574858929e-06, "loss": 0.4185, "step": 12635 }, { "epoch": 2.34, "learning_rate": 2.4483340286130152e-06, "loss": 0.4194, "step": 12636 }, { "epoch": 2.34, "learning_rate": 2.4470247836645887e-06, "loss": 0.4143, "step": 12637 }, { "epoch": 2.34, "learning_rate": 2.4457158400658932e-06, "loss": 0.4013, "step": 12638 }, { "epoch": 2.34, "learning_rate": 2.4444071978691464e-06, "loss": 0.4144, "step": 12639 }, { "epoch": 2.34, "learning_rate": 2.443098857126567e-06, "loss": 0.4119, "step": 12640 }, { "epoch": 2.34, "learning_rate": 2.4417908178903516e-06, "loss": 0.4207, "step": 12641 }, { "epoch": 2.34, "learning_rate": 2.4404830802126855e-06, "loss": 0.4281, "step": 12642 }, { "epoch": 2.34, "learning_rate": 2.4391756441457515e-06, "loss": 0.4158, "step": 12643 }, { "epoch": 2.34, "learning_rate": 2.4378685097417078e-06, "loss": 0.3987, "step": 12644 }, { "epoch": 2.34, "learning_rate": 2.4365616770527133e-06, "loss": 0.4211, "step": 12645 }, { "epoch": 2.34, "learning_rate": 2.4352551461309038e-06, "loss": 0.4037, "step": 12646 }, { "epoch": 2.34, "learning_rate": 2.4339489170284057e-06, "loss": 0.397, "step": 12647 }, { "epoch": 2.34, "learning_rate": 2.4326429897973403e-06, "loss": 0.4244, "step": 12648 }, { "epoch": 2.34, "learning_rate": 2.4313373644898065e-06, "loss": 0.4187, "step": 12649 }, { "epoch": 2.34, "learning_rate": 2.4300320411579014e-06, "loss": 0.4249, "step": 12650 }, { "epoch": 2.34, "learning_rate": 2.4287270198537016e-06, "loss": 0.402, "step": 12651 }, { "epoch": 2.34, "learning_rate": 2.427422300629274e-06, "loss": 0.4199, "step": 12652 }, { "epoch": 2.34, "learning_rate": 2.4261178835366794e-06, "loss": 0.4142, "step": 12653 }, { "epoch": 2.34, "learning_rate": 2.424813768627955e-06, "loss": 0.4247, "step": 12654 }, { "epoch": 2.34, "learning_rate": 2.42350995595514e-06, "loss": 0.4145, "step": 12655 }, { "epoch": 2.34, "learning_rate": 2.4222064455702466e-06, "loss": 0.4263, "step": 12656 }, { "epoch": 2.34, "learning_rate": 2.4209032375252894e-06, "loss": 0.3993, "step": 12657 }, { "epoch": 2.34, "learning_rate": 2.4196003318722573e-06, "loss": 0.4264, "step": 12658 }, { "epoch": 2.34, "learning_rate": 2.4182977286631404e-06, "loss": 0.4377, "step": 12659 }, { "epoch": 2.34, "learning_rate": 2.416995427949904e-06, "loss": 0.4151, "step": 12660 }, { "epoch": 2.34, "learning_rate": 2.4156934297845137e-06, "loss": 0.3934, "step": 12661 }, { "epoch": 2.34, "learning_rate": 2.4143917342189106e-06, "loss": 0.413, "step": 12662 }, { "epoch": 2.34, "learning_rate": 2.4130903413050354e-06, "loss": 0.4043, "step": 12663 }, { "epoch": 2.34, "learning_rate": 2.411789251094806e-06, "loss": 0.4178, "step": 12664 }, { "epoch": 2.34, "learning_rate": 2.4104884636401394e-06, "loss": 0.3999, "step": 12665 }, { "epoch": 2.34, "learning_rate": 2.4091879789929284e-06, "loss": 0.4168, "step": 12666 }, { "epoch": 2.34, "learning_rate": 2.407887797205066e-06, "loss": 0.4236, "step": 12667 }, { "epoch": 2.34, "learning_rate": 2.4065879183284247e-06, "loss": 0.4111, "step": 12668 }, { "epoch": 2.34, "learning_rate": 2.405288342414863e-06, "loss": 0.4062, "step": 12669 }, { "epoch": 2.34, "learning_rate": 2.403989069516238e-06, "loss": 0.4315, "step": 12670 }, { "epoch": 2.34, "learning_rate": 2.4026900996843828e-06, "loss": 0.4316, "step": 12671 }, { "epoch": 2.34, "learning_rate": 2.4013914329711295e-06, "loss": 0.421, "step": 12672 }, { "epoch": 2.34, "learning_rate": 2.4000930694282898e-06, "loss": 0.4155, "step": 12673 }, { "epoch": 2.34, "learning_rate": 2.3987950091076628e-06, "loss": 0.4173, "step": 12674 }, { "epoch": 2.35, "learning_rate": 2.397497252061045e-06, "loss": 0.4119, "step": 12675 }, { "epoch": 2.35, "learning_rate": 2.3961997983402073e-06, "loss": 0.4248, "step": 12676 }, { "epoch": 2.35, "learning_rate": 2.3949026479969227e-06, "loss": 0.4223, "step": 12677 }, { "epoch": 2.35, "learning_rate": 2.39360580108294e-06, "loss": 0.4049, "step": 12678 }, { "epoch": 2.35, "learning_rate": 2.392309257650005e-06, "loss": 0.4257, "step": 12679 }, { "epoch": 2.35, "learning_rate": 2.391013017749846e-06, "loss": 0.4162, "step": 12680 }, { "epoch": 2.35, "learning_rate": 2.389717081434176e-06, "loss": 0.4231, "step": 12681 }, { "epoch": 2.35, "learning_rate": 2.3884214487547074e-06, "loss": 0.4301, "step": 12682 }, { "epoch": 2.35, "learning_rate": 2.3871261197631292e-06, "loss": 0.4021, "step": 12683 }, { "epoch": 2.35, "learning_rate": 2.385831094511125e-06, "loss": 0.4002, "step": 12684 }, { "epoch": 2.35, "learning_rate": 2.3845363730503636e-06, "loss": 0.4329, "step": 12685 }, { "epoch": 2.35, "learning_rate": 2.383241955432498e-06, "loss": 0.4165, "step": 12686 }, { "epoch": 2.35, "learning_rate": 2.3819478417091803e-06, "loss": 0.4335, "step": 12687 }, { "epoch": 2.35, "learning_rate": 2.380654031932036e-06, "loss": 0.4163, "step": 12688 }, { "epoch": 2.35, "learning_rate": 2.379360526152691e-06, "loss": 0.4287, "step": 12689 }, { "epoch": 2.35, "learning_rate": 2.3780673244227527e-06, "loss": 0.4143, "step": 12690 }, { "epoch": 2.35, "learning_rate": 2.376774426793813e-06, "loss": 0.4243, "step": 12691 }, { "epoch": 2.35, "learning_rate": 2.3754818333174633e-06, "loss": 0.426, "step": 12692 }, { "epoch": 2.35, "learning_rate": 2.374189544045268e-06, "loss": 0.4501, "step": 12693 }, { "epoch": 2.35, "learning_rate": 2.3728975590287952e-06, "loss": 0.4236, "step": 12694 }, { "epoch": 2.35, "learning_rate": 2.371605878319587e-06, "loss": 0.4207, "step": 12695 }, { "epoch": 2.35, "learning_rate": 2.3703145019691797e-06, "loss": 0.421, "step": 12696 }, { "epoch": 2.35, "learning_rate": 2.369023430029099e-06, "loss": 0.4152, "step": 12697 }, { "epoch": 2.35, "learning_rate": 2.3677326625508534e-06, "loss": 0.4168, "step": 12698 }, { "epoch": 2.35, "learning_rate": 2.3664421995859467e-06, "loss": 0.4178, "step": 12699 }, { "epoch": 2.35, "learning_rate": 2.3651520411858596e-06, "loss": 0.4185, "step": 12700 }, { "epoch": 2.35, "learning_rate": 2.3638621874020727e-06, "loss": 0.415, "step": 12701 }, { "epoch": 2.35, "learning_rate": 2.3625726382860482e-06, "loss": 0.4145, "step": 12702 }, { "epoch": 2.35, "learning_rate": 2.361283393889231e-06, "loss": 0.4015, "step": 12703 }, { "epoch": 2.35, "learning_rate": 2.359994454263067e-06, "loss": 0.4238, "step": 12704 }, { "epoch": 2.35, "learning_rate": 2.3587058194589762e-06, "loss": 0.4036, "step": 12705 }, { "epoch": 2.35, "learning_rate": 2.3574174895283786e-06, "loss": 0.4174, "step": 12706 }, { "epoch": 2.35, "learning_rate": 2.356129464522674e-06, "loss": 0.4163, "step": 12707 }, { "epoch": 2.35, "learning_rate": 2.354841744493247e-06, "loss": 0.4099, "step": 12708 }, { "epoch": 2.35, "learning_rate": 2.353554329491484e-06, "loss": 0.4194, "step": 12709 }, { "epoch": 2.35, "learning_rate": 2.3522672195687433e-06, "loss": 0.423, "step": 12710 }, { "epoch": 2.35, "learning_rate": 2.3509804147763835e-06, "loss": 0.4139, "step": 12711 }, { "epoch": 2.35, "learning_rate": 2.3496939151657404e-06, "loss": 0.4057, "step": 12712 }, { "epoch": 2.35, "learning_rate": 2.3484077207881496e-06, "loss": 0.4198, "step": 12713 }, { "epoch": 2.35, "learning_rate": 2.3471218316949207e-06, "loss": 0.4285, "step": 12714 }, { "epoch": 2.35, "learning_rate": 2.345836247937365e-06, "loss": 0.4245, "step": 12715 }, { "epoch": 2.35, "learning_rate": 2.344550969566769e-06, "loss": 0.4179, "step": 12716 }, { "epoch": 2.35, "learning_rate": 2.3432659966344175e-06, "loss": 0.4304, "step": 12717 }, { "epoch": 2.35, "learning_rate": 2.341981329191575e-06, "loss": 0.4114, "step": 12718 }, { "epoch": 2.35, "learning_rate": 2.3406969672895006e-06, "loss": 0.4441, "step": 12719 }, { "epoch": 2.35, "learning_rate": 2.339412910979435e-06, "loss": 0.4238, "step": 12720 }, { "epoch": 2.35, "learning_rate": 2.338129160312613e-06, "loss": 0.4106, "step": 12721 }, { "epoch": 2.35, "learning_rate": 2.336845715340249e-06, "loss": 0.3932, "step": 12722 }, { "epoch": 2.35, "learning_rate": 2.3355625761135557e-06, "loss": 0.3914, "step": 12723 }, { "epoch": 2.35, "learning_rate": 2.334279742683726e-06, "loss": 0.4063, "step": 12724 }, { "epoch": 2.35, "learning_rate": 2.332997215101939e-06, "loss": 0.4214, "step": 12725 }, { "epoch": 2.35, "learning_rate": 2.3317149934193704e-06, "loss": 0.4137, "step": 12726 }, { "epoch": 2.35, "learning_rate": 2.330433077687173e-06, "loss": 0.3941, "step": 12727 }, { "epoch": 2.35, "learning_rate": 2.3291514679564996e-06, "loss": 0.4289, "step": 12728 }, { "epoch": 2.36, "learning_rate": 2.3278701642784807e-06, "loss": 0.4212, "step": 12729 }, { "epoch": 2.36, "learning_rate": 2.326589166704234e-06, "loss": 0.4185, "step": 12730 }, { "epoch": 2.36, "learning_rate": 2.3253084752848753e-06, "loss": 0.4063, "step": 12731 }, { "epoch": 2.36, "learning_rate": 2.324028090071496e-06, "loss": 0.3901, "step": 12732 }, { "epoch": 2.36, "learning_rate": 2.322748011115188e-06, "loss": 0.4038, "step": 12733 }, { "epoch": 2.36, "learning_rate": 2.321468238467021e-06, "loss": 0.398, "step": 12734 }, { "epoch": 2.36, "learning_rate": 2.3201887721780503e-06, "loss": 0.4233, "step": 12735 }, { "epoch": 2.36, "learning_rate": 2.3189096122993326e-06, "loss": 0.4233, "step": 12736 }, { "epoch": 2.36, "learning_rate": 2.317630758881897e-06, "loss": 0.4217, "step": 12737 }, { "epoch": 2.36, "learning_rate": 2.3163522119767733e-06, "loss": 0.4254, "step": 12738 }, { "epoch": 2.36, "learning_rate": 2.3150739716349713e-06, "loss": 0.4279, "step": 12739 }, { "epoch": 2.36, "learning_rate": 2.3137960379074862e-06, "loss": 0.409, "step": 12740 }, { "epoch": 2.36, "learning_rate": 2.3125184108453113e-06, "loss": 0.4455, "step": 12741 }, { "epoch": 2.36, "learning_rate": 2.3112410904994155e-06, "loss": 0.4029, "step": 12742 }, { "epoch": 2.36, "learning_rate": 2.309964076920769e-06, "loss": 0.4228, "step": 12743 }, { "epoch": 2.36, "learning_rate": 2.3086873701603143e-06, "loss": 0.448, "step": 12744 }, { "epoch": 2.36, "learning_rate": 2.3074109702689964e-06, "loss": 0.4143, "step": 12745 }, { "epoch": 2.36, "learning_rate": 2.306134877297739e-06, "loss": 0.3981, "step": 12746 }, { "epoch": 2.36, "learning_rate": 2.304859091297451e-06, "loss": 0.4314, "step": 12747 }, { "epoch": 2.36, "learning_rate": 2.3035836123190414e-06, "loss": 0.4178, "step": 12748 }, { "epoch": 2.36, "learning_rate": 2.3023084404133932e-06, "loss": 0.4125, "step": 12749 }, { "epoch": 2.36, "learning_rate": 2.3010335756313906e-06, "loss": 0.4249, "step": 12750 }, { "epoch": 2.36, "learning_rate": 2.299759018023893e-06, "loss": 0.3967, "step": 12751 }, { "epoch": 2.36, "learning_rate": 2.298484767641751e-06, "loss": 0.4125, "step": 12752 }, { "epoch": 2.36, "learning_rate": 2.2972108245358103e-06, "loss": 0.4399, "step": 12753 }, { "epoch": 2.36, "learning_rate": 2.295937188756894e-06, "loss": 0.4088, "step": 12754 }, { "epoch": 2.36, "learning_rate": 2.2946638603558237e-06, "loss": 0.4132, "step": 12755 }, { "epoch": 2.36, "learning_rate": 2.2933908393833983e-06, "loss": 0.4172, "step": 12756 }, { "epoch": 2.36, "learning_rate": 2.292118125890407e-06, "loss": 0.4066, "step": 12757 }, { "epoch": 2.36, "learning_rate": 2.290845719927636e-06, "loss": 0.4373, "step": 12758 }, { "epoch": 2.36, "learning_rate": 2.2895736215458433e-06, "loss": 0.4305, "step": 12759 }, { "epoch": 2.36, "learning_rate": 2.2883018307957907e-06, "loss": 0.4174, "step": 12760 }, { "epoch": 2.36, "learning_rate": 2.2870303477282153e-06, "loss": 0.4003, "step": 12761 }, { "epoch": 2.36, "learning_rate": 2.285759172393851e-06, "loss": 0.4258, "step": 12762 }, { "epoch": 2.36, "learning_rate": 2.2844883048434096e-06, "loss": 0.403, "step": 12763 }, { "epoch": 2.36, "learning_rate": 2.2832177451276037e-06, "loss": 0.3874, "step": 12764 }, { "epoch": 2.36, "learning_rate": 2.2819474932971196e-06, "loss": 0.4221, "step": 12765 }, { "epoch": 2.36, "learning_rate": 2.2806775494026445e-06, "loss": 0.4147, "step": 12766 }, { "epoch": 2.36, "learning_rate": 2.27940791349484e-06, "loss": 0.4128, "step": 12767 }, { "epoch": 2.36, "learning_rate": 2.278138585624368e-06, "loss": 0.4248, "step": 12768 }, { "epoch": 2.36, "learning_rate": 2.276869565841866e-06, "loss": 0.3901, "step": 12769 }, { "epoch": 2.36, "learning_rate": 2.2756008541979734e-06, "loss": 0.4349, "step": 12770 }, { "epoch": 2.36, "learning_rate": 2.2743324507433016e-06, "loss": 0.4131, "step": 12771 }, { "epoch": 2.36, "learning_rate": 2.273064355528465e-06, "loss": 0.3984, "step": 12772 }, { "epoch": 2.36, "learning_rate": 2.2717965686040546e-06, "loss": 0.4193, "step": 12773 }, { "epoch": 2.36, "learning_rate": 2.27052909002065e-06, "loss": 0.402, "step": 12774 }, { "epoch": 2.36, "learning_rate": 2.2692619198288256e-06, "loss": 0.3945, "step": 12775 }, { "epoch": 2.36, "learning_rate": 2.2679950580791364e-06, "loss": 0.4434, "step": 12776 }, { "epoch": 2.36, "learning_rate": 2.266728504822131e-06, "loss": 0.4077, "step": 12777 }, { "epoch": 2.36, "learning_rate": 2.26546226010834e-06, "loss": 0.4033, "step": 12778 }, { "epoch": 2.36, "learning_rate": 2.2641963239882826e-06, "loss": 0.4147, "step": 12779 }, { "epoch": 2.36, "learning_rate": 2.262930696512472e-06, "loss": 0.4054, "step": 12780 }, { "epoch": 2.36, "learning_rate": 2.261665377731399e-06, "loss": 0.3868, "step": 12781 }, { "epoch": 2.36, "learning_rate": 2.2604003676955523e-06, "loss": 0.4242, "step": 12782 }, { "epoch": 2.37, "learning_rate": 2.259135666455402e-06, "loss": 0.4117, "step": 12783 }, { "epoch": 2.37, "learning_rate": 2.257871274061405e-06, "loss": 0.3872, "step": 12784 }, { "epoch": 2.37, "learning_rate": 2.256607190564012e-06, "loss": 0.4121, "step": 12785 }, { "epoch": 2.37, "learning_rate": 2.2553434160136522e-06, "loss": 0.4204, "step": 12786 }, { "epoch": 2.37, "learning_rate": 2.2540799504607546e-06, "loss": 0.4266, "step": 12787 }, { "epoch": 2.37, "learning_rate": 2.2528167939557235e-06, "loss": 0.4207, "step": 12788 }, { "epoch": 2.37, "learning_rate": 2.25155394654896e-06, "loss": 0.4233, "step": 12789 }, { "epoch": 2.37, "learning_rate": 2.25029140829085e-06, "loss": 0.4112, "step": 12790 }, { "epoch": 2.37, "learning_rate": 2.249029179231761e-06, "loss": 0.4213, "step": 12791 }, { "epoch": 2.37, "learning_rate": 2.2477672594220602e-06, "loss": 0.4198, "step": 12792 }, { "epoch": 2.37, "learning_rate": 2.2465056489120895e-06, "loss": 0.403, "step": 12793 }, { "epoch": 2.37, "learning_rate": 2.2452443477521912e-06, "loss": 0.4014, "step": 12794 }, { "epoch": 2.37, "learning_rate": 2.243983355992686e-06, "loss": 0.4104, "step": 12795 }, { "epoch": 2.37, "learning_rate": 2.2427226736838827e-06, "loss": 0.41, "step": 12796 }, { "epoch": 2.37, "learning_rate": 2.241462300876085e-06, "loss": 0.4292, "step": 12797 }, { "epoch": 2.37, "learning_rate": 2.240202237619573e-06, "loss": 0.4079, "step": 12798 }, { "epoch": 2.37, "learning_rate": 2.238942483964629e-06, "loss": 0.3999, "step": 12799 }, { "epoch": 2.37, "learning_rate": 2.23768303996151e-06, "loss": 0.4023, "step": 12800 }, { "epoch": 2.37, "learning_rate": 2.2364239056604643e-06, "loss": 0.4011, "step": 12801 }, { "epoch": 2.37, "learning_rate": 2.235165081111733e-06, "loss": 0.42, "step": 12802 }, { "epoch": 2.37, "learning_rate": 2.2339065663655356e-06, "loss": 0.4034, "step": 12803 }, { "epoch": 2.37, "learning_rate": 2.2326483614720917e-06, "loss": 0.4407, "step": 12804 }, { "epoch": 2.37, "learning_rate": 2.2313904664815965e-06, "loss": 0.4345, "step": 12805 }, { "epoch": 2.37, "learning_rate": 2.230132881444236e-06, "loss": 0.4239, "step": 12806 }, { "epoch": 2.37, "learning_rate": 2.2288756064101903e-06, "loss": 0.4254, "step": 12807 }, { "epoch": 2.37, "learning_rate": 2.2276186414296175e-06, "loss": 0.4069, "step": 12808 }, { "epoch": 2.37, "learning_rate": 2.2263619865526733e-06, "loss": 0.4032, "step": 12809 }, { "epoch": 2.37, "learning_rate": 2.22510564182949e-06, "loss": 0.4067, "step": 12810 }, { "epoch": 2.37, "learning_rate": 2.223849607310201e-06, "loss": 0.4162, "step": 12811 }, { "epoch": 2.37, "learning_rate": 2.2225938830449123e-06, "loss": 0.4291, "step": 12812 }, { "epoch": 2.37, "learning_rate": 2.2213384690837304e-06, "loss": 0.4114, "step": 12813 }, { "epoch": 2.37, "learning_rate": 2.2200833654767396e-06, "loss": 0.4064, "step": 12814 }, { "epoch": 2.37, "learning_rate": 2.21882857227402e-06, "loss": 0.4216, "step": 12815 }, { "epoch": 2.37, "learning_rate": 2.2175740895256327e-06, "loss": 0.4097, "step": 12816 }, { "epoch": 2.37, "learning_rate": 2.2163199172816317e-06, "loss": 0.407, "step": 12817 }, { "epoch": 2.37, "learning_rate": 2.215066055592053e-06, "loss": 0.4121, "step": 12818 }, { "epoch": 2.37, "learning_rate": 2.213812504506928e-06, "loss": 0.3982, "step": 12819 }, { "epoch": 2.37, "learning_rate": 2.2125592640762662e-06, "loss": 0.4274, "step": 12820 }, { "epoch": 2.37, "learning_rate": 2.211306334350073e-06, "loss": 0.4085, "step": 12821 }, { "epoch": 2.37, "learning_rate": 2.2100537153783376e-06, "loss": 0.3932, "step": 12822 }, { "epoch": 2.37, "learning_rate": 2.2088014072110332e-06, "loss": 0.4115, "step": 12823 }, { "epoch": 2.37, "learning_rate": 2.207549409898131e-06, "loss": 0.4082, "step": 12824 }, { "epoch": 2.37, "learning_rate": 2.2062977234895764e-06, "loss": 0.4301, "step": 12825 }, { "epoch": 2.37, "learning_rate": 2.205046348035316e-06, "loss": 0.4242, "step": 12826 }, { "epoch": 2.37, "learning_rate": 2.203795283585275e-06, "loss": 0.4091, "step": 12827 }, { "epoch": 2.37, "learning_rate": 2.2025445301893644e-06, "loss": 0.4137, "step": 12828 }, { "epoch": 2.37, "learning_rate": 2.201294087897493e-06, "loss": 0.4219, "step": 12829 }, { "epoch": 2.37, "learning_rate": 2.2000439567595466e-06, "loss": 0.4124, "step": 12830 }, { "epoch": 2.37, "learning_rate": 2.1987941368254073e-06, "loss": 0.4176, "step": 12831 }, { "epoch": 2.37, "learning_rate": 2.197544628144935e-06, "loss": 0.4116, "step": 12832 }, { "epoch": 2.37, "learning_rate": 2.1962954307679906e-06, "loss": 0.4269, "step": 12833 }, { "epoch": 2.37, "learning_rate": 2.195046544744409e-06, "loss": 0.4262, "step": 12834 }, { "epoch": 2.37, "learning_rate": 2.1937979701240176e-06, "loss": 0.4265, "step": 12835 }, { "epoch": 2.37, "learning_rate": 2.192549706956637e-06, "loss": 0.3939, "step": 12836 }, { "epoch": 2.38, "learning_rate": 2.1913017552920656e-06, "loss": 0.4056, "step": 12837 }, { "epoch": 2.38, "learning_rate": 2.1900541151800992e-06, "loss": 0.4303, "step": 12838 }, { "epoch": 2.38, "learning_rate": 2.1888067866705134e-06, "loss": 0.4087, "step": 12839 }, { "epoch": 2.38, "learning_rate": 2.1875597698130725e-06, "loss": 0.3952, "step": 12840 }, { "epoch": 2.38, "learning_rate": 2.186313064657535e-06, "loss": 0.4017, "step": 12841 }, { "epoch": 2.38, "learning_rate": 2.185066671253637e-06, "loss": 0.4195, "step": 12842 }, { "epoch": 2.38, "learning_rate": 2.183820589651113e-06, "loss": 0.4169, "step": 12843 }, { "epoch": 2.38, "learning_rate": 2.1825748198996755e-06, "loss": 0.4242, "step": 12844 }, { "epoch": 2.38, "learning_rate": 2.1813293620490273e-06, "loss": 0.4276, "step": 12845 }, { "epoch": 2.38, "learning_rate": 2.1800842161488635e-06, "loss": 0.4282, "step": 12846 }, { "epoch": 2.38, "learning_rate": 2.1788393822488584e-06, "loss": 0.4098, "step": 12847 }, { "epoch": 2.38, "learning_rate": 2.177594860398685e-06, "loss": 0.4247, "step": 12848 }, { "epoch": 2.38, "learning_rate": 2.1763506506479924e-06, "loss": 0.3975, "step": 12849 }, { "epoch": 2.38, "learning_rate": 2.1751067530464233e-06, "loss": 0.4012, "step": 12850 }, { "epoch": 2.38, "learning_rate": 2.173863167643608e-06, "loss": 0.3881, "step": 12851 }, { "epoch": 2.38, "learning_rate": 2.172619894489161e-06, "loss": 0.396, "step": 12852 }, { "epoch": 2.38, "learning_rate": 2.1713769336326906e-06, "loss": 0.4275, "step": 12853 }, { "epoch": 2.38, "learning_rate": 2.170134285123784e-06, "loss": 0.4086, "step": 12854 }, { "epoch": 2.38, "learning_rate": 2.168891949012024e-06, "loss": 0.3983, "step": 12855 }, { "epoch": 2.38, "learning_rate": 2.1676499253469785e-06, "loss": 0.4137, "step": 12856 }, { "epoch": 2.38, "learning_rate": 2.166408214178195e-06, "loss": 0.3935, "step": 12857 }, { "epoch": 2.38, "learning_rate": 2.1651668155552242e-06, "loss": 0.4136, "step": 12858 }, { "epoch": 2.38, "learning_rate": 2.1639257295275882e-06, "loss": 0.4081, "step": 12859 }, { "epoch": 2.38, "learning_rate": 2.1626849561448114e-06, "loss": 0.399, "step": 12860 }, { "epoch": 2.38, "learning_rate": 2.1614444954563906e-06, "loss": 0.4199, "step": 12861 }, { "epoch": 2.38, "learning_rate": 2.160204347511825e-06, "loss": 0.4206, "step": 12862 }, { "epoch": 2.38, "learning_rate": 2.1589645123605883e-06, "loss": 0.4443, "step": 12863 }, { "epoch": 2.38, "learning_rate": 2.1577249900521526e-06, "loss": 0.4242, "step": 12864 }, { "epoch": 2.38, "learning_rate": 2.1564857806359673e-06, "loss": 0.4198, "step": 12865 }, { "epoch": 2.38, "learning_rate": 2.1552468841614804e-06, "loss": 0.4055, "step": 12866 }, { "epoch": 2.38, "learning_rate": 2.1540083006781164e-06, "loss": 0.4133, "step": 12867 }, { "epoch": 2.38, "learning_rate": 2.152770030235297e-06, "loss": 0.4262, "step": 12868 }, { "epoch": 2.38, "learning_rate": 2.151532072882422e-06, "loss": 0.4159, "step": 12869 }, { "epoch": 2.38, "learning_rate": 2.1502944286688897e-06, "loss": 0.413, "step": 12870 }, { "epoch": 2.38, "learning_rate": 2.149057097644075e-06, "loss": 0.432, "step": 12871 }, { "epoch": 2.38, "learning_rate": 2.1478200798573444e-06, "loss": 0.397, "step": 12872 }, { "epoch": 2.38, "learning_rate": 2.146583375358058e-06, "loss": 0.4475, "step": 12873 }, { "epoch": 2.38, "learning_rate": 2.145346984195551e-06, "loss": 0.4446, "step": 12874 }, { "epoch": 2.38, "learning_rate": 2.14411090641916e-06, "loss": 0.4152, "step": 12875 }, { "epoch": 2.38, "learning_rate": 2.142875142078197e-06, "loss": 0.4259, "step": 12876 }, { "epoch": 2.38, "learning_rate": 2.1416396912219705e-06, "loss": 0.44, "step": 12877 }, { "epoch": 2.38, "learning_rate": 2.1404045538997707e-06, "loss": 0.4369, "step": 12878 }, { "epoch": 2.38, "learning_rate": 2.1391697301608747e-06, "loss": 0.4088, "step": 12879 }, { "epoch": 2.38, "learning_rate": 2.1379352200545567e-06, "loss": 0.4163, "step": 12880 }, { "epoch": 2.38, "learning_rate": 2.1367010236300636e-06, "loss": 0.419, "step": 12881 }, { "epoch": 2.38, "learning_rate": 2.1354671409366435e-06, "loss": 0.4283, "step": 12882 }, { "epoch": 2.38, "learning_rate": 2.1342335720235243e-06, "loss": 0.4235, "step": 12883 }, { "epoch": 2.38, "learning_rate": 2.1330003169399195e-06, "loss": 0.4071, "step": 12884 }, { "epoch": 2.38, "learning_rate": 2.13176737573504e-06, "loss": 0.394, "step": 12885 }, { "epoch": 2.38, "learning_rate": 2.1305347484580708e-06, "loss": 0.4446, "step": 12886 }, { "epoch": 2.38, "learning_rate": 2.129302435158198e-06, "loss": 0.4079, "step": 12887 }, { "epoch": 2.38, "learning_rate": 2.128070435884587e-06, "loss": 0.4336, "step": 12888 }, { "epoch": 2.38, "learning_rate": 2.1268387506863875e-06, "loss": 0.3987, "step": 12889 }, { "epoch": 2.38, "learning_rate": 2.1256073796127485e-06, "loss": 0.4347, "step": 12890 }, { "epoch": 2.39, "learning_rate": 2.1243763227127924e-06, "loss": 0.411, "step": 12891 }, { "epoch": 2.39, "learning_rate": 2.1231455800356425e-06, "loss": 0.421, "step": 12892 }, { "epoch": 2.39, "learning_rate": 2.1219151516304004e-06, "loss": 0.4112, "step": 12893 }, { "epoch": 2.39, "learning_rate": 2.1206850375461564e-06, "loss": 0.4105, "step": 12894 }, { "epoch": 2.39, "learning_rate": 2.119455237831992e-06, "loss": 0.4016, "step": 12895 }, { "epoch": 2.39, "learning_rate": 2.118225752536972e-06, "loss": 0.4171, "step": 12896 }, { "epoch": 2.39, "learning_rate": 2.1169965817101533e-06, "loss": 0.4136, "step": 12897 }, { "epoch": 2.39, "learning_rate": 2.1157677254005736e-06, "loss": 0.4145, "step": 12898 }, { "epoch": 2.39, "learning_rate": 2.114539183657268e-06, "loss": 0.4088, "step": 12899 }, { "epoch": 2.39, "learning_rate": 2.1133109565292487e-06, "loss": 0.4158, "step": 12900 }, { "epoch": 2.39, "learning_rate": 2.112083044065517e-06, "loss": 0.4166, "step": 12901 }, { "epoch": 2.39, "learning_rate": 2.110855446315072e-06, "loss": 0.4172, "step": 12902 }, { "epoch": 2.39, "learning_rate": 2.1096281633268843e-06, "loss": 0.4288, "step": 12903 }, { "epoch": 2.39, "learning_rate": 2.1084011951499284e-06, "loss": 0.4194, "step": 12904 }, { "epoch": 2.39, "learning_rate": 2.1071745418331524e-06, "loss": 0.3926, "step": 12905 }, { "epoch": 2.39, "learning_rate": 2.1059482034254973e-06, "loss": 0.4261, "step": 12906 }, { "epoch": 2.39, "learning_rate": 2.1047221799758955e-06, "loss": 0.4129, "step": 12907 }, { "epoch": 2.39, "learning_rate": 2.1034964715332583e-06, "loss": 0.4087, "step": 12908 }, { "epoch": 2.39, "learning_rate": 2.102271078146495e-06, "loss": 0.4032, "step": 12909 }, { "epoch": 2.39, "learning_rate": 2.1010459998644907e-06, "loss": 0.41, "step": 12910 }, { "epoch": 2.39, "learning_rate": 2.0998212367361294e-06, "loss": 0.4138, "step": 12911 }, { "epoch": 2.39, "learning_rate": 2.0985967888102708e-06, "loss": 0.4179, "step": 12912 }, { "epoch": 2.39, "learning_rate": 2.0973726561357742e-06, "loss": 0.4135, "step": 12913 }, { "epoch": 2.39, "learning_rate": 2.0961488387614746e-06, "loss": 0.4128, "step": 12914 }, { "epoch": 2.39, "learning_rate": 2.0949253367362055e-06, "loss": 0.4291, "step": 12915 }, { "epoch": 2.39, "learning_rate": 2.0937021501087763e-06, "loss": 0.4153, "step": 12916 }, { "epoch": 2.39, "learning_rate": 2.092479278927997e-06, "loss": 0.4207, "step": 12917 }, { "epoch": 2.39, "learning_rate": 2.0912567232426496e-06, "loss": 0.4139, "step": 12918 }, { "epoch": 2.39, "learning_rate": 2.090034483101521e-06, "loss": 0.4057, "step": 12919 }, { "epoch": 2.39, "learning_rate": 2.088812558553368e-06, "loss": 0.3963, "step": 12920 }, { "epoch": 2.39, "learning_rate": 2.087590949646949e-06, "loss": 0.425, "step": 12921 }, { "epoch": 2.39, "learning_rate": 2.0863696564310022e-06, "loss": 0.3989, "step": 12922 }, { "epoch": 2.39, "learning_rate": 2.085148678954252e-06, "loss": 0.4001, "step": 12923 }, { "epoch": 2.39, "learning_rate": 2.0839280172654173e-06, "loss": 0.4316, "step": 12924 }, { "epoch": 2.39, "learning_rate": 2.0827076714131966e-06, "loss": 0.4072, "step": 12925 }, { "epoch": 2.39, "learning_rate": 2.0814876414462837e-06, "loss": 0.4374, "step": 12926 }, { "epoch": 2.39, "learning_rate": 2.080267927413353e-06, "loss": 0.4063, "step": 12927 }, { "epoch": 2.39, "learning_rate": 2.0790485293630668e-06, "loss": 0.4143, "step": 12928 }, { "epoch": 2.39, "learning_rate": 2.0778294473440817e-06, "loss": 0.4168, "step": 12929 }, { "epoch": 2.39, "learning_rate": 2.0766106814050315e-06, "loss": 0.404, "step": 12930 }, { "epoch": 2.39, "learning_rate": 2.075392231594547e-06, "loss": 0.4244, "step": 12931 }, { "epoch": 2.39, "learning_rate": 2.0741740979612426e-06, "loss": 0.3972, "step": 12932 }, { "epoch": 2.39, "learning_rate": 2.0729562805537128e-06, "loss": 0.4282, "step": 12933 }, { "epoch": 2.39, "learning_rate": 2.0717387794205546e-06, "loss": 0.4218, "step": 12934 }, { "epoch": 2.39, "learning_rate": 2.0705215946103365e-06, "loss": 0.4179, "step": 12935 }, { "epoch": 2.39, "learning_rate": 2.0693047261716294e-06, "loss": 0.4175, "step": 12936 }, { "epoch": 2.39, "learning_rate": 2.0680881741529803e-06, "loss": 0.4111, "step": 12937 }, { "epoch": 2.39, "learning_rate": 2.0668719386029245e-06, "loss": 0.4098, "step": 12938 }, { "epoch": 2.39, "learning_rate": 2.0656560195699937e-06, "loss": 0.4166, "step": 12939 }, { "epoch": 2.39, "learning_rate": 2.0644404171026943e-06, "loss": 0.4153, "step": 12940 }, { "epoch": 2.39, "learning_rate": 2.063225131249533e-06, "loss": 0.4181, "step": 12941 }, { "epoch": 2.39, "learning_rate": 2.062010162058995e-06, "loss": 0.3985, "step": 12942 }, { "epoch": 2.39, "learning_rate": 2.0607955095795505e-06, "loss": 0.3957, "step": 12943 }, { "epoch": 2.39, "learning_rate": 2.0595811738596706e-06, "loss": 0.4374, "step": 12944 }, { "epoch": 2.4, "learning_rate": 2.058367154947797e-06, "loss": 0.4171, "step": 12945 }, { "epoch": 2.4, "learning_rate": 2.057153452892373e-06, "loss": 0.4219, "step": 12946 }, { "epoch": 2.4, "learning_rate": 2.0559400677418186e-06, "loss": 0.4323, "step": 12947 }, { "epoch": 2.4, "learning_rate": 2.0547269995445484e-06, "loss": 0.4253, "step": 12948 }, { "epoch": 2.4, "learning_rate": 2.0535142483489622e-06, "loss": 0.423, "step": 12949 }, { "epoch": 2.4, "learning_rate": 2.052301814203441e-06, "loss": 0.4527, "step": 12950 }, { "epoch": 2.4, "learning_rate": 2.0510896971563665e-06, "loss": 0.4177, "step": 12951 }, { "epoch": 2.4, "learning_rate": 2.049877897256093e-06, "loss": 0.4013, "step": 12952 }, { "epoch": 2.4, "learning_rate": 2.048666414550975e-06, "loss": 0.4217, "step": 12953 }, { "epoch": 2.4, "learning_rate": 2.047455249089345e-06, "loss": 0.4157, "step": 12954 }, { "epoch": 2.4, "learning_rate": 2.0462444009195247e-06, "loss": 0.3918, "step": 12955 }, { "epoch": 2.4, "learning_rate": 2.0450338700898297e-06, "loss": 0.4233, "step": 12956 }, { "epoch": 2.4, "learning_rate": 2.0438236566485516e-06, "loss": 0.4172, "step": 12957 }, { "epoch": 2.4, "learning_rate": 2.0426137606439823e-06, "loss": 0.4016, "step": 12958 }, { "epoch": 2.4, "learning_rate": 2.041404182124389e-06, "loss": 0.4427, "step": 12959 }, { "epoch": 2.4, "learning_rate": 2.0401949211380355e-06, "loss": 0.4017, "step": 12960 }, { "epoch": 2.4, "learning_rate": 2.0389859777331656e-06, "loss": 0.4095, "step": 12961 }, { "epoch": 2.4, "learning_rate": 2.037777351958018e-06, "loss": 0.4171, "step": 12962 }, { "epoch": 2.4, "learning_rate": 2.03656904386081e-06, "loss": 0.4372, "step": 12963 }, { "epoch": 2.4, "learning_rate": 2.0353610534897562e-06, "loss": 0.4114, "step": 12964 }, { "epoch": 2.4, "learning_rate": 2.034153380893047e-06, "loss": 0.4309, "step": 12965 }, { "epoch": 2.4, "learning_rate": 2.0329460261188717e-06, "loss": 0.3981, "step": 12966 }, { "epoch": 2.4, "learning_rate": 2.0317389892153973e-06, "loss": 0.405, "step": 12967 }, { "epoch": 2.4, "learning_rate": 2.030532270230787e-06, "loss": 0.4344, "step": 12968 }, { "epoch": 2.4, "learning_rate": 2.0293258692131824e-06, "loss": 0.4318, "step": 12969 }, { "epoch": 2.4, "learning_rate": 2.0281197862107195e-06, "loss": 0.4335, "step": 12970 }, { "epoch": 2.4, "learning_rate": 2.0269140212715176e-06, "loss": 0.4185, "step": 12971 }, { "epoch": 2.4, "learning_rate": 2.0257085744436834e-06, "loss": 0.4081, "step": 12972 }, { "epoch": 2.4, "learning_rate": 2.024503445775314e-06, "loss": 0.4229, "step": 12973 }, { "epoch": 2.4, "learning_rate": 2.023298635314489e-06, "loss": 0.4061, "step": 12974 }, { "epoch": 2.4, "learning_rate": 2.022094143109282e-06, "loss": 0.4221, "step": 12975 }, { "epoch": 2.4, "learning_rate": 2.0208899692077487e-06, "loss": 0.4237, "step": 12976 }, { "epoch": 2.4, "learning_rate": 2.0196861136579305e-06, "loss": 0.4094, "step": 12977 }, { "epoch": 2.4, "learning_rate": 2.018482576507863e-06, "loss": 0.3976, "step": 12978 }, { "epoch": 2.4, "learning_rate": 2.0172793578055606e-06, "loss": 0.4166, "step": 12979 }, { "epoch": 2.4, "learning_rate": 2.0160764575990354e-06, "loss": 0.4125, "step": 12980 }, { "epoch": 2.4, "learning_rate": 2.0148738759362774e-06, "loss": 0.421, "step": 12981 }, { "epoch": 2.4, "learning_rate": 2.0136716128652643e-06, "loss": 0.4265, "step": 12982 }, { "epoch": 2.4, "learning_rate": 2.0124696684339717e-06, "loss": 0.4242, "step": 12983 }, { "epoch": 2.4, "learning_rate": 2.0112680426903475e-06, "loss": 0.4042, "step": 12984 }, { "epoch": 2.4, "learning_rate": 2.01006673568234e-06, "loss": 0.4165, "step": 12985 }, { "epoch": 2.4, "learning_rate": 2.0088657474578767e-06, "loss": 0.4182, "step": 12986 }, { "epoch": 2.4, "learning_rate": 2.007665078064873e-06, "loss": 0.3973, "step": 12987 }, { "epoch": 2.4, "learning_rate": 2.0064647275512374e-06, "loss": 0.4152, "step": 12988 }, { "epoch": 2.4, "learning_rate": 2.005264695964857e-06, "loss": 0.4318, "step": 12989 }, { "epoch": 2.4, "learning_rate": 2.0040649833536165e-06, "loss": 0.4182, "step": 12990 }, { "epoch": 2.4, "learning_rate": 2.0028655897653747e-06, "loss": 0.4198, "step": 12991 }, { "epoch": 2.4, "learning_rate": 2.0016665152479943e-06, "loss": 0.4237, "step": 12992 }, { "epoch": 2.4, "learning_rate": 2.0004677598493104e-06, "loss": 0.414, "step": 12993 }, { "epoch": 2.4, "learning_rate": 1.99926932361715e-06, "loss": 0.4119, "step": 12994 }, { "epoch": 2.4, "learning_rate": 1.9980712065993325e-06, "loss": 0.4299, "step": 12995 }, { "epoch": 2.4, "learning_rate": 1.996873408843656e-06, "loss": 0.4248, "step": 12996 }, { "epoch": 2.4, "learning_rate": 1.9956759303979165e-06, "loss": 0.4096, "step": 12997 }, { "epoch": 2.4, "learning_rate": 1.9944787713098877e-06, "loss": 0.4072, "step": 12998 }, { "epoch": 2.4, "learning_rate": 1.993281931627331e-06, "loss": 0.4066, "step": 12999 }, { "epoch": 2.41, "learning_rate": 1.992085411398004e-06, "loss": 0.4214, "step": 13000 }, { "epoch": 2.41, "learning_rate": 1.990889210669641e-06, "loss": 0.4216, "step": 13001 }, { "epoch": 2.41, "learning_rate": 1.9896933294899713e-06, "loss": 0.4084, "step": 13002 }, { "epoch": 2.41, "learning_rate": 1.9884977679067074e-06, "loss": 0.4038, "step": 13003 }, { "epoch": 2.41, "learning_rate": 1.9873025259675473e-06, "loss": 0.4309, "step": 13004 }, { "epoch": 2.41, "learning_rate": 1.9861076037201843e-06, "loss": 0.4025, "step": 13005 }, { "epoch": 2.41, "learning_rate": 1.9849130012122875e-06, "loss": 0.4096, "step": 13006 }, { "epoch": 2.41, "learning_rate": 1.9837187184915253e-06, "loss": 0.4117, "step": 13007 }, { "epoch": 2.41, "learning_rate": 1.9825247556055436e-06, "loss": 0.4184, "step": 13008 }, { "epoch": 2.41, "learning_rate": 1.9813311126019785e-06, "loss": 0.417, "step": 13009 }, { "epoch": 2.41, "learning_rate": 1.980137789528458e-06, "loss": 0.4239, "step": 13010 }, { "epoch": 2.41, "learning_rate": 1.9789447864325893e-06, "loss": 0.4184, "step": 13011 }, { "epoch": 2.41, "learning_rate": 1.9777521033619752e-06, "loss": 0.4185, "step": 13012 }, { "epoch": 2.41, "learning_rate": 1.9765597403641966e-06, "loss": 0.4112, "step": 13013 }, { "epoch": 2.41, "learning_rate": 1.975367697486833e-06, "loss": 0.4031, "step": 13014 }, { "epoch": 2.41, "learning_rate": 1.974175974777437e-06, "loss": 0.3993, "step": 13015 }, { "epoch": 2.41, "learning_rate": 1.9729845722835637e-06, "loss": 0.4179, "step": 13016 }, { "epoch": 2.41, "learning_rate": 1.971793490052741e-06, "loss": 0.3922, "step": 13017 }, { "epoch": 2.41, "learning_rate": 1.970602728132498e-06, "loss": 0.4183, "step": 13018 }, { "epoch": 2.41, "learning_rate": 1.969412286570337e-06, "loss": 0.435, "step": 13019 }, { "epoch": 2.41, "learning_rate": 1.968222165413759e-06, "loss": 0.4114, "step": 13020 }, { "epoch": 2.41, "learning_rate": 1.9670323647102452e-06, "loss": 0.4133, "step": 13021 }, { "epoch": 2.41, "learning_rate": 1.9658428845072686e-06, "loss": 0.4155, "step": 13022 }, { "epoch": 2.41, "learning_rate": 1.9646537248522844e-06, "loss": 0.4025, "step": 13023 }, { "epoch": 2.41, "learning_rate": 1.963464885792742e-06, "loss": 0.3926, "step": 13024 }, { "epoch": 2.41, "learning_rate": 1.9622763673760714e-06, "loss": 0.4121, "step": 13025 }, { "epoch": 2.41, "learning_rate": 1.96108816964969e-06, "loss": 0.4128, "step": 13026 }, { "epoch": 2.41, "learning_rate": 1.9599002926610087e-06, "loss": 0.4362, "step": 13027 }, { "epoch": 2.41, "learning_rate": 1.9587127364574177e-06, "loss": 0.4108, "step": 13028 }, { "epoch": 2.41, "learning_rate": 1.9575255010863037e-06, "loss": 0.4125, "step": 13029 }, { "epoch": 2.41, "learning_rate": 1.956338586595031e-06, "loss": 0.414, "step": 13030 }, { "epoch": 2.41, "learning_rate": 1.9551519930309537e-06, "loss": 0.4274, "step": 13031 }, { "epoch": 2.41, "learning_rate": 1.953965720441421e-06, "loss": 0.4047, "step": 13032 }, { "epoch": 2.41, "learning_rate": 1.9527797688737548e-06, "loss": 0.4142, "step": 13033 }, { "epoch": 2.41, "learning_rate": 1.951594138375281e-06, "loss": 0.4149, "step": 13034 }, { "epoch": 2.41, "learning_rate": 1.9504088289932967e-06, "loss": 0.4095, "step": 13035 }, { "epoch": 2.41, "learning_rate": 1.9492238407750987e-06, "loss": 0.4053, "step": 13036 }, { "epoch": 2.41, "learning_rate": 1.948039173767965e-06, "loss": 0.41, "step": 13037 }, { "epoch": 2.41, "learning_rate": 1.946854828019157e-06, "loss": 0.4135, "step": 13038 }, { "epoch": 2.41, "learning_rate": 1.945670803575934e-06, "loss": 0.4469, "step": 13039 }, { "epoch": 2.41, "learning_rate": 1.9444871004855315e-06, "loss": 0.4127, "step": 13040 }, { "epoch": 2.41, "learning_rate": 1.943303718795182e-06, "loss": 0.4128, "step": 13041 }, { "epoch": 2.41, "learning_rate": 1.9421206585520967e-06, "loss": 0.4045, "step": 13042 }, { "epoch": 2.41, "learning_rate": 1.940937919803477e-06, "loss": 0.4001, "step": 13043 }, { "epoch": 2.41, "learning_rate": 1.9397555025965155e-06, "loss": 0.4042, "step": 13044 }, { "epoch": 2.41, "learning_rate": 1.9385734069783835e-06, "loss": 0.4047, "step": 13045 }, { "epoch": 2.41, "learning_rate": 1.9373916329962492e-06, "loss": 0.4179, "step": 13046 }, { "epoch": 2.41, "learning_rate": 1.936210180697262e-06, "loss": 0.4305, "step": 13047 }, { "epoch": 2.41, "learning_rate": 1.935029050128556e-06, "loss": 0.4189, "step": 13048 }, { "epoch": 2.41, "learning_rate": 1.933848241337262e-06, "loss": 0.4038, "step": 13049 }, { "epoch": 2.41, "learning_rate": 1.9326677543704866e-06, "loss": 0.4086, "step": 13050 }, { "epoch": 2.41, "learning_rate": 1.931487589275334e-06, "loss": 0.3871, "step": 13051 }, { "epoch": 2.41, "learning_rate": 1.930307746098887e-06, "loss": 0.4007, "step": 13052 }, { "epoch": 2.41, "learning_rate": 1.929128224888218e-06, "loss": 0.4127, "step": 13053 }, { "epoch": 2.42, "learning_rate": 1.927949025690394e-06, "loss": 0.4366, "step": 13054 }, { "epoch": 2.42, "learning_rate": 1.926770148552455e-06, "loss": 0.4137, "step": 13055 }, { "epoch": 2.42, "learning_rate": 1.925591593521443e-06, "loss": 0.4246, "step": 13056 }, { "epoch": 2.42, "learning_rate": 1.9244133606443747e-06, "loss": 0.4319, "step": 13057 }, { "epoch": 2.42, "learning_rate": 1.923235449968264e-06, "loss": 0.4216, "step": 13058 }, { "epoch": 2.42, "learning_rate": 1.922057861540105e-06, "loss": 0.4129, "step": 13059 }, { "epoch": 2.42, "learning_rate": 1.9208805954068788e-06, "loss": 0.4241, "step": 13060 }, { "epoch": 2.42, "learning_rate": 1.919703651615562e-06, "loss": 0.3975, "step": 13061 }, { "epoch": 2.42, "learning_rate": 1.9185270302131066e-06, "loss": 0.4131, "step": 13062 }, { "epoch": 2.42, "learning_rate": 1.917350731246462e-06, "loss": 0.4111, "step": 13063 }, { "epoch": 2.42, "learning_rate": 1.9161747547625563e-06, "loss": 0.415, "step": 13064 }, { "epoch": 2.42, "learning_rate": 1.9149991008083134e-06, "loss": 0.4204, "step": 13065 }, { "epoch": 2.42, "learning_rate": 1.913823769430636e-06, "loss": 0.4111, "step": 13066 }, { "epoch": 2.42, "learning_rate": 1.9126487606764197e-06, "loss": 0.4016, "step": 13067 }, { "epoch": 2.42, "learning_rate": 1.911474074592544e-06, "loss": 0.4175, "step": 13068 }, { "epoch": 2.42, "learning_rate": 1.910299711225878e-06, "loss": 0.4422, "step": 13069 }, { "epoch": 2.42, "learning_rate": 1.9091256706232754e-06, "loss": 0.4285, "step": 13070 }, { "epoch": 2.42, "learning_rate": 1.9079519528315792e-06, "loss": 0.4176, "step": 13071 }, { "epoch": 2.42, "learning_rate": 1.9067785578976162e-06, "loss": 0.4116, "step": 13072 }, { "epoch": 2.42, "learning_rate": 1.9056054858682072e-06, "loss": 0.4117, "step": 13073 }, { "epoch": 2.42, "learning_rate": 1.9044327367901527e-06, "loss": 0.4275, "step": 13074 }, { "epoch": 2.42, "learning_rate": 1.903260310710241e-06, "loss": 0.4382, "step": 13075 }, { "epoch": 2.42, "learning_rate": 1.9020882076752556e-06, "loss": 0.3967, "step": 13076 }, { "epoch": 2.42, "learning_rate": 1.9009164277319547e-06, "loss": 0.4251, "step": 13077 }, { "epoch": 2.42, "learning_rate": 1.8997449709270954e-06, "loss": 0.3797, "step": 13078 }, { "epoch": 2.42, "learning_rate": 1.8985738373074126e-06, "loss": 0.4165, "step": 13079 }, { "epoch": 2.42, "learning_rate": 1.8974030269196364e-06, "loss": 0.3901, "step": 13080 }, { "epoch": 2.42, "learning_rate": 1.8962325398104775e-06, "loss": 0.4019, "step": 13081 }, { "epoch": 2.42, "learning_rate": 1.895062376026634e-06, "loss": 0.4025, "step": 13082 }, { "epoch": 2.42, "learning_rate": 1.8938925356147997e-06, "loss": 0.4259, "step": 13083 }, { "epoch": 2.42, "learning_rate": 1.8927230186216417e-06, "loss": 0.4176, "step": 13084 }, { "epoch": 2.42, "learning_rate": 1.891553825093827e-06, "loss": 0.4562, "step": 13085 }, { "epoch": 2.42, "learning_rate": 1.890384955078003e-06, "loss": 0.4117, "step": 13086 }, { "epoch": 2.42, "learning_rate": 1.889216408620802e-06, "loss": 0.4151, "step": 13087 }, { "epoch": 2.42, "learning_rate": 1.8880481857688526e-06, "loss": 0.4245, "step": 13088 }, { "epoch": 2.42, "learning_rate": 1.8868802865687586e-06, "loss": 0.419, "step": 13089 }, { "epoch": 2.42, "learning_rate": 1.8857127110671225e-06, "loss": 0.4198, "step": 13090 }, { "epoch": 2.42, "learning_rate": 1.8845454593105273e-06, "loss": 0.4053, "step": 13091 }, { "epoch": 2.42, "learning_rate": 1.8833785313455388e-06, "loss": 0.4142, "step": 13092 }, { "epoch": 2.42, "learning_rate": 1.8822119272187222e-06, "loss": 0.4205, "step": 13093 }, { "epoch": 2.42, "learning_rate": 1.881045646976618e-06, "loss": 0.4097, "step": 13094 }, { "epoch": 2.42, "learning_rate": 1.8798796906657635e-06, "loss": 0.4027, "step": 13095 }, { "epoch": 2.42, "learning_rate": 1.8787140583326746e-06, "loss": 0.4044, "step": 13096 }, { "epoch": 2.42, "learning_rate": 1.8775487500238565e-06, "loss": 0.4153, "step": 13097 }, { "epoch": 2.42, "learning_rate": 1.8763837657858075e-06, "loss": 0.4336, "step": 13098 }, { "epoch": 2.42, "learning_rate": 1.8752191056650026e-06, "loss": 0.4409, "step": 13099 }, { "epoch": 2.42, "learning_rate": 1.874054769707916e-06, "loss": 0.3954, "step": 13100 }, { "epoch": 2.42, "learning_rate": 1.8728907579609967e-06, "loss": 0.4378, "step": 13101 }, { "epoch": 2.42, "learning_rate": 1.8717270704706913e-06, "loss": 0.4375, "step": 13102 }, { "epoch": 2.42, "learning_rate": 1.870563707283427e-06, "loss": 0.4139, "step": 13103 }, { "epoch": 2.42, "learning_rate": 1.8694006684456168e-06, "loss": 0.4316, "step": 13104 }, { "epoch": 2.42, "learning_rate": 1.86823795400367e-06, "loss": 0.4126, "step": 13105 }, { "epoch": 2.42, "learning_rate": 1.8670755640039696e-06, "loss": 0.4126, "step": 13106 }, { "epoch": 2.42, "learning_rate": 1.8659134984928995e-06, "loss": 0.4099, "step": 13107 }, { "epoch": 2.43, "learning_rate": 1.8647517575168207e-06, "loss": 0.4294, "step": 13108 }, { "epoch": 2.43, "learning_rate": 1.8635903411220823e-06, "loss": 0.4152, "step": 13109 }, { "epoch": 2.43, "learning_rate": 1.8624292493550278e-06, "loss": 0.4214, "step": 13110 }, { "epoch": 2.43, "learning_rate": 1.8612684822619774e-06, "loss": 0.4081, "step": 13111 }, { "epoch": 2.43, "learning_rate": 1.8601080398892478e-06, "loss": 0.4187, "step": 13112 }, { "epoch": 2.43, "learning_rate": 1.8589479222831353e-06, "loss": 0.4115, "step": 13113 }, { "epoch": 2.43, "learning_rate": 1.8577881294899303e-06, "loss": 0.4108, "step": 13114 }, { "epoch": 2.43, "learning_rate": 1.8566286615559014e-06, "loss": 0.4307, "step": 13115 }, { "epoch": 2.43, "learning_rate": 1.8554695185273142e-06, "loss": 0.4387, "step": 13116 }, { "epoch": 2.43, "learning_rate": 1.8543107004504123e-06, "loss": 0.4362, "step": 13117 }, { "epoch": 2.43, "learning_rate": 1.8531522073714337e-06, "loss": 0.4088, "step": 13118 }, { "epoch": 2.43, "learning_rate": 1.8519940393365966e-06, "loss": 0.3913, "step": 13119 }, { "epoch": 2.43, "learning_rate": 1.850836196392114e-06, "loss": 0.4268, "step": 13120 }, { "epoch": 2.43, "learning_rate": 1.849678678584177e-06, "loss": 0.3865, "step": 13121 }, { "epoch": 2.43, "learning_rate": 1.8485214859589729e-06, "loss": 0.4137, "step": 13122 }, { "epoch": 2.43, "learning_rate": 1.8473646185626671e-06, "loss": 0.4224, "step": 13123 }, { "epoch": 2.43, "learning_rate": 1.8462080764414213e-06, "loss": 0.4275, "step": 13124 }, { "epoch": 2.43, "learning_rate": 1.8450518596413768e-06, "loss": 0.4109, "step": 13125 }, { "epoch": 2.43, "learning_rate": 1.8438959682086621e-06, "loss": 0.4199, "step": 13126 }, { "epoch": 2.43, "learning_rate": 1.8427404021894014e-06, "loss": 0.3949, "step": 13127 }, { "epoch": 2.43, "learning_rate": 1.841585161629692e-06, "loss": 0.4485, "step": 13128 }, { "epoch": 2.43, "learning_rate": 1.8404302465756317e-06, "loss": 0.415, "step": 13129 }, { "epoch": 2.43, "learning_rate": 1.8392756570732995e-06, "loss": 0.4433, "step": 13130 }, { "epoch": 2.43, "learning_rate": 1.8381213931687559e-06, "loss": 0.4083, "step": 13131 }, { "epoch": 2.43, "learning_rate": 1.8369674549080596e-06, "loss": 0.4259, "step": 13132 }, { "epoch": 2.43, "learning_rate": 1.8358138423372463e-06, "loss": 0.4326, "step": 13133 }, { "epoch": 2.43, "learning_rate": 1.8346605555023466e-06, "loss": 0.4162, "step": 13134 }, { "epoch": 2.43, "learning_rate": 1.8335075944493742e-06, "loss": 0.41, "step": 13135 }, { "epoch": 2.43, "learning_rate": 1.832354959224326e-06, "loss": 0.4031, "step": 13136 }, { "epoch": 2.43, "learning_rate": 1.831202649873196e-06, "loss": 0.4208, "step": 13137 }, { "epoch": 2.43, "learning_rate": 1.8300506664419526e-06, "loss": 0.4046, "step": 13138 }, { "epoch": 2.43, "learning_rate": 1.8288990089765646e-06, "loss": 0.4154, "step": 13139 }, { "epoch": 2.43, "learning_rate": 1.8277476775229773e-06, "loss": 0.4054, "step": 13140 }, { "epoch": 2.43, "learning_rate": 1.8265966721271255e-06, "loss": 0.4308, "step": 13141 }, { "epoch": 2.43, "learning_rate": 1.8254459928349355e-06, "loss": 0.4111, "step": 13142 }, { "epoch": 2.43, "learning_rate": 1.8242956396923129e-06, "loss": 0.4052, "step": 13143 }, { "epoch": 2.43, "learning_rate": 1.8231456127451608e-06, "loss": 0.4153, "step": 13144 }, { "epoch": 2.43, "learning_rate": 1.821995912039356e-06, "loss": 0.4033, "step": 13145 }, { "epoch": 2.43, "learning_rate": 1.8208465376207762e-06, "loss": 0.4242, "step": 13146 }, { "epoch": 2.43, "learning_rate": 1.819697489535277e-06, "loss": 0.4223, "step": 13147 }, { "epoch": 2.43, "learning_rate": 1.8185487678286996e-06, "loss": 0.4165, "step": 13148 }, { "epoch": 2.43, "learning_rate": 1.8174003725468803e-06, "loss": 0.4084, "step": 13149 }, { "epoch": 2.43, "learning_rate": 1.816252303735635e-06, "loss": 0.4246, "step": 13150 }, { "epoch": 2.43, "learning_rate": 1.8151045614407736e-06, "loss": 0.4349, "step": 13151 }, { "epoch": 2.43, "learning_rate": 1.8139571457080863e-06, "loss": 0.4138, "step": 13152 }, { "epoch": 2.43, "learning_rate": 1.8128100565833496e-06, "loss": 0.4363, "step": 13153 }, { "epoch": 2.43, "learning_rate": 1.8116632941123358e-06, "loss": 0.4254, "step": 13154 }, { "epoch": 2.43, "learning_rate": 1.810516858340795e-06, "loss": 0.4174, "step": 13155 }, { "epoch": 2.43, "learning_rate": 1.8093707493144708e-06, "loss": 0.4004, "step": 13156 }, { "epoch": 2.43, "learning_rate": 1.8082249670790897e-06, "loss": 0.4016, "step": 13157 }, { "epoch": 2.43, "learning_rate": 1.807079511680362e-06, "loss": 0.4101, "step": 13158 }, { "epoch": 2.43, "learning_rate": 1.8059343831639964e-06, "loss": 0.4221, "step": 13159 }, { "epoch": 2.43, "learning_rate": 1.8047895815756754e-06, "loss": 0.3996, "step": 13160 }, { "epoch": 2.43, "learning_rate": 1.8036451069610795e-06, "loss": 0.4088, "step": 13161 }, { "epoch": 2.44, "learning_rate": 1.802500959365867e-06, "loss": 0.4169, "step": 13162 }, { "epoch": 2.44, "learning_rate": 1.8013571388356899e-06, "loss": 0.3932, "step": 13163 }, { "epoch": 2.44, "learning_rate": 1.8002136454161822e-06, "loss": 0.4021, "step": 13164 }, { "epoch": 2.44, "learning_rate": 1.7990704791529712e-06, "loss": 0.4016, "step": 13165 }, { "epoch": 2.44, "learning_rate": 1.7979276400916611e-06, "loss": 0.4128, "step": 13166 }, { "epoch": 2.44, "learning_rate": 1.796785128277856e-06, "loss": 0.4193, "step": 13167 }, { "epoch": 2.44, "learning_rate": 1.7956429437571331e-06, "loss": 0.4365, "step": 13168 }, { "epoch": 2.44, "learning_rate": 1.794501086575069e-06, "loss": 0.4249, "step": 13169 }, { "epoch": 2.44, "learning_rate": 1.7933595567772178e-06, "loss": 0.4122, "step": 13170 }, { "epoch": 2.44, "learning_rate": 1.7922183544091276e-06, "loss": 0.3981, "step": 13171 }, { "epoch": 2.44, "learning_rate": 1.7910774795163278e-06, "loss": 0.4266, "step": 13172 }, { "epoch": 2.44, "learning_rate": 1.7899369321443394e-06, "loss": 0.4171, "step": 13173 }, { "epoch": 2.44, "learning_rate": 1.7887967123386673e-06, "loss": 0.4152, "step": 13174 }, { "epoch": 2.44, "learning_rate": 1.7876568201448008e-06, "loss": 0.4102, "step": 13175 }, { "epoch": 2.44, "learning_rate": 1.7865172556082255e-06, "loss": 0.4114, "step": 13176 }, { "epoch": 2.44, "learning_rate": 1.785378018774402e-06, "loss": 0.4242, "step": 13177 }, { "epoch": 2.44, "learning_rate": 1.784239109688789e-06, "loss": 0.4042, "step": 13178 }, { "epoch": 2.44, "learning_rate": 1.783100528396825e-06, "loss": 0.4171, "step": 13179 }, { "epoch": 2.44, "learning_rate": 1.7819622749439335e-06, "loss": 0.4044, "step": 13180 }, { "epoch": 2.44, "learning_rate": 1.7808243493755351e-06, "loss": 0.4033, "step": 13181 }, { "epoch": 2.44, "learning_rate": 1.7796867517370254e-06, "loss": 0.4304, "step": 13182 }, { "epoch": 2.44, "learning_rate": 1.7785494820737958e-06, "loss": 0.3993, "step": 13183 }, { "epoch": 2.44, "learning_rate": 1.7774125404312214e-06, "loss": 0.4111, "step": 13184 }, { "epoch": 2.44, "learning_rate": 1.7762759268546602e-06, "loss": 0.4174, "step": 13185 }, { "epoch": 2.44, "learning_rate": 1.7751396413894673e-06, "loss": 0.4021, "step": 13186 }, { "epoch": 2.44, "learning_rate": 1.7740036840809716e-06, "loss": 0.4061, "step": 13187 }, { "epoch": 2.44, "learning_rate": 1.7728680549745003e-06, "loss": 0.3988, "step": 13188 }, { "epoch": 2.44, "learning_rate": 1.7717327541153605e-06, "loss": 0.4297, "step": 13189 }, { "epoch": 2.44, "learning_rate": 1.7705977815488506e-06, "loss": 0.409, "step": 13190 }, { "epoch": 2.44, "learning_rate": 1.7694631373202542e-06, "loss": 0.4131, "step": 13191 }, { "epoch": 2.44, "learning_rate": 1.7683288214748373e-06, "loss": 0.4161, "step": 13192 }, { "epoch": 2.44, "learning_rate": 1.7671948340578616e-06, "loss": 0.4224, "step": 13193 }, { "epoch": 2.44, "learning_rate": 1.7660611751145684e-06, "loss": 0.4126, "step": 13194 }, { "epoch": 2.44, "learning_rate": 1.7649278446901906e-06, "loss": 0.3941, "step": 13195 }, { "epoch": 2.44, "learning_rate": 1.7637948428299456e-06, "loss": 0.4374, "step": 13196 }, { "epoch": 2.44, "learning_rate": 1.7626621695790346e-06, "loss": 0.4157, "step": 13197 }, { "epoch": 2.44, "learning_rate": 1.7615298249826552e-06, "loss": 0.4195, "step": 13198 }, { "epoch": 2.44, "learning_rate": 1.7603978090859797e-06, "loss": 0.4044, "step": 13199 }, { "epoch": 2.44, "learning_rate": 1.759266121934179e-06, "loss": 0.4085, "step": 13200 }, { "epoch": 2.44, "learning_rate": 1.7581347635724032e-06, "loss": 0.4385, "step": 13201 }, { "epoch": 2.44, "learning_rate": 1.757003734045788e-06, "loss": 0.3923, "step": 13202 }, { "epoch": 2.44, "learning_rate": 1.7558730333994644e-06, "loss": 0.4216, "step": 13203 }, { "epoch": 2.44, "learning_rate": 1.7547426616785413e-06, "loss": 0.4133, "step": 13204 }, { "epoch": 2.44, "learning_rate": 1.7536126189281222e-06, "loss": 0.437, "step": 13205 }, { "epoch": 2.44, "learning_rate": 1.7524829051932924e-06, "loss": 0.4242, "step": 13206 }, { "epoch": 2.44, "learning_rate": 1.7513535205191224e-06, "loss": 0.4252, "step": 13207 }, { "epoch": 2.44, "learning_rate": 1.7502244649506772e-06, "loss": 0.4122, "step": 13208 }, { "epoch": 2.44, "learning_rate": 1.7490957385329988e-06, "loss": 0.396, "step": 13209 }, { "epoch": 2.44, "learning_rate": 1.7479673413111275e-06, "loss": 0.4083, "step": 13210 }, { "epoch": 2.44, "learning_rate": 1.7468392733300777e-06, "loss": 0.4203, "step": 13211 }, { "epoch": 2.44, "learning_rate": 1.745711534634864e-06, "loss": 0.416, "step": 13212 }, { "epoch": 2.44, "learning_rate": 1.7445841252704742e-06, "loss": 0.4194, "step": 13213 }, { "epoch": 2.44, "learning_rate": 1.7434570452818966e-06, "loss": 0.4196, "step": 13214 }, { "epoch": 2.44, "learning_rate": 1.7423302947140941e-06, "loss": 0.4207, "step": 13215 }, { "epoch": 2.45, "learning_rate": 1.7412038736120263e-06, "loss": 0.4109, "step": 13216 }, { "epoch": 2.45, "learning_rate": 1.7400777820206305e-06, "loss": 0.4166, "step": 13217 }, { "epoch": 2.45, "learning_rate": 1.7389520199848409e-06, "loss": 0.416, "step": 13218 }, { "epoch": 2.45, "learning_rate": 1.7378265875495682e-06, "loss": 0.41, "step": 13219 }, { "epoch": 2.45, "learning_rate": 1.7367014847597207e-06, "loss": 0.3949, "step": 13220 }, { "epoch": 2.45, "learning_rate": 1.7355767116601818e-06, "loss": 0.4122, "step": 13221 }, { "epoch": 2.45, "learning_rate": 1.7344522682958332e-06, "loss": 0.4087, "step": 13222 }, { "epoch": 2.45, "learning_rate": 1.7333281547115365e-06, "loss": 0.4078, "step": 13223 }, { "epoch": 2.45, "learning_rate": 1.7322043709521386e-06, "loss": 0.4188, "step": 13224 }, { "epoch": 2.45, "learning_rate": 1.731080917062481e-06, "loss": 0.4029, "step": 13225 }, { "epoch": 2.45, "learning_rate": 1.7299577930873823e-06, "loss": 0.4081, "step": 13226 }, { "epoch": 2.45, "learning_rate": 1.728834999071659e-06, "loss": 0.4171, "step": 13227 }, { "epoch": 2.45, "learning_rate": 1.7277125350601066e-06, "loss": 0.4053, "step": 13228 }, { "epoch": 2.45, "learning_rate": 1.7265904010975042e-06, "loss": 0.4321, "step": 13229 }, { "epoch": 2.45, "learning_rate": 1.725468597228631e-06, "loss": 0.4022, "step": 13230 }, { "epoch": 2.45, "learning_rate": 1.7243471234982378e-06, "loss": 0.4125, "step": 13231 }, { "epoch": 2.45, "learning_rate": 1.7232259799510742e-06, "loss": 0.4192, "step": 13232 }, { "epoch": 2.45, "learning_rate": 1.7221051666318678e-06, "loss": 0.417, "step": 13233 }, { "epoch": 2.45, "learning_rate": 1.7209846835853427e-06, "loss": 0.4178, "step": 13234 }, { "epoch": 2.45, "learning_rate": 1.719864530856199e-06, "loss": 0.4099, "step": 13235 }, { "epoch": 2.45, "learning_rate": 1.7187447084891284e-06, "loss": 0.4336, "step": 13236 }, { "epoch": 2.45, "learning_rate": 1.7176252165288144e-06, "loss": 0.3891, "step": 13237 }, { "epoch": 2.45, "learning_rate": 1.7165060550199176e-06, "loss": 0.4354, "step": 13238 }, { "epoch": 2.45, "learning_rate": 1.7153872240070945e-06, "loss": 0.4038, "step": 13239 }, { "epoch": 2.45, "learning_rate": 1.714268723534983e-06, "loss": 0.4221, "step": 13240 }, { "epoch": 2.45, "learning_rate": 1.7131505536482062e-06, "loss": 0.429, "step": 13241 }, { "epoch": 2.45, "learning_rate": 1.7120327143913817e-06, "loss": 0.4273, "step": 13242 }, { "epoch": 2.45, "learning_rate": 1.710915205809105e-06, "loss": 0.409, "step": 13243 }, { "epoch": 2.45, "learning_rate": 1.7097980279459669e-06, "loss": 0.396, "step": 13244 }, { "epoch": 2.45, "learning_rate": 1.7086811808465397e-06, "loss": 0.4061, "step": 13245 }, { "epoch": 2.45, "learning_rate": 1.7075646645553789e-06, "loss": 0.4065, "step": 13246 }, { "epoch": 2.45, "learning_rate": 1.7064484791170378e-06, "loss": 0.4386, "step": 13247 }, { "epoch": 2.45, "learning_rate": 1.7053326245760448e-06, "loss": 0.4044, "step": 13248 }, { "epoch": 2.45, "learning_rate": 1.704217100976925e-06, "loss": 0.4216, "step": 13249 }, { "epoch": 2.45, "learning_rate": 1.7031019083641841e-06, "loss": 0.4048, "step": 13250 }, { "epoch": 2.45, "learning_rate": 1.701987046782313e-06, "loss": 0.4159, "step": 13251 }, { "epoch": 2.45, "learning_rate": 1.7008725162757977e-06, "loss": 0.4199, "step": 13252 }, { "epoch": 2.45, "learning_rate": 1.699758316889102e-06, "loss": 0.3989, "step": 13253 }, { "epoch": 2.45, "learning_rate": 1.6986444486666831e-06, "loss": 0.4179, "step": 13254 }, { "epoch": 2.45, "learning_rate": 1.6975309116529803e-06, "loss": 0.4183, "step": 13255 }, { "epoch": 2.45, "learning_rate": 1.6964177058924237e-06, "loss": 0.4192, "step": 13256 }, { "epoch": 2.45, "learning_rate": 1.6953048314294274e-06, "loss": 0.4094, "step": 13257 }, { "epoch": 2.45, "learning_rate": 1.6941922883083894e-06, "loss": 0.4188, "step": 13258 }, { "epoch": 2.45, "learning_rate": 1.6930800765737054e-06, "loss": 0.4176, "step": 13259 }, { "epoch": 2.45, "learning_rate": 1.6919681962697433e-06, "loss": 0.4182, "step": 13260 }, { "epoch": 2.45, "learning_rate": 1.6908566474408694e-06, "loss": 0.4096, "step": 13261 }, { "epoch": 2.45, "learning_rate": 1.6897454301314332e-06, "loss": 0.4427, "step": 13262 }, { "epoch": 2.45, "learning_rate": 1.6886345443857644e-06, "loss": 0.4173, "step": 13263 }, { "epoch": 2.45, "learning_rate": 1.6875239902481922e-06, "loss": 0.418, "step": 13264 }, { "epoch": 2.45, "learning_rate": 1.686413767763021e-06, "loss": 0.4235, "step": 13265 }, { "epoch": 2.45, "learning_rate": 1.6853038769745466e-06, "loss": 0.4138, "step": 13266 }, { "epoch": 2.45, "learning_rate": 1.684194317927057e-06, "loss": 0.4092, "step": 13267 }, { "epoch": 2.45, "learning_rate": 1.6830850906648156e-06, "loss": 0.3865, "step": 13268 }, { "epoch": 2.45, "learning_rate": 1.6819761952320823e-06, "loss": 0.4136, "step": 13269 }, { "epoch": 2.46, "learning_rate": 1.6808676316730965e-06, "loss": 0.4433, "step": 13270 }, { "epoch": 2.46, "learning_rate": 1.6797594000320916e-06, "loss": 0.4058, "step": 13271 }, { "epoch": 2.46, "learning_rate": 1.6786515003532821e-06, "loss": 0.4206, "step": 13272 }, { "epoch": 2.46, "learning_rate": 1.6775439326808696e-06, "loss": 0.4258, "step": 13273 }, { "epoch": 2.46, "learning_rate": 1.6764366970590473e-06, "loss": 0.4151, "step": 13274 }, { "epoch": 2.46, "learning_rate": 1.6753297935319878e-06, "loss": 0.3927, "step": 13275 }, { "epoch": 2.46, "learning_rate": 1.6742232221438592e-06, "loss": 0.4031, "step": 13276 }, { "epoch": 2.46, "learning_rate": 1.6731169829388095e-06, "loss": 0.4255, "step": 13277 }, { "epoch": 2.46, "learning_rate": 1.6720110759609732e-06, "loss": 0.4069, "step": 13278 }, { "epoch": 2.46, "learning_rate": 1.6709055012544772e-06, "loss": 0.3832, "step": 13279 }, { "epoch": 2.46, "learning_rate": 1.66980025886343e-06, "loss": 0.4094, "step": 13280 }, { "epoch": 2.46, "learning_rate": 1.6686953488319313e-06, "loss": 0.4059, "step": 13281 }, { "epoch": 2.46, "learning_rate": 1.6675907712040606e-06, "loss": 0.4122, "step": 13282 }, { "epoch": 2.46, "learning_rate": 1.6664865260238938e-06, "loss": 0.4229, "step": 13283 }, { "epoch": 2.46, "learning_rate": 1.6653826133354855e-06, "loss": 0.4179, "step": 13284 }, { "epoch": 2.46, "learning_rate": 1.6642790331828773e-06, "loss": 0.4125, "step": 13285 }, { "epoch": 2.46, "learning_rate": 1.6631757856101049e-06, "loss": 0.4281, "step": 13286 }, { "epoch": 2.46, "learning_rate": 1.662072870661181e-06, "loss": 0.4437, "step": 13287 }, { "epoch": 2.46, "learning_rate": 1.6609702883801137e-06, "loss": 0.4176, "step": 13288 }, { "epoch": 2.46, "learning_rate": 1.6598680388108946e-06, "loss": 0.4225, "step": 13289 }, { "epoch": 2.46, "learning_rate": 1.658766121997496e-06, "loss": 0.4028, "step": 13290 }, { "epoch": 2.46, "learning_rate": 1.6576645379838875e-06, "loss": 0.4087, "step": 13291 }, { "epoch": 2.46, "learning_rate": 1.6565632868140168e-06, "loss": 0.431, "step": 13292 }, { "epoch": 2.46, "learning_rate": 1.655462368531826e-06, "loss": 0.4138, "step": 13293 }, { "epoch": 2.46, "learning_rate": 1.6543617831812364e-06, "loss": 0.4226, "step": 13294 }, { "epoch": 2.46, "learning_rate": 1.6532615308061584e-06, "loss": 0.4259, "step": 13295 }, { "epoch": 2.46, "learning_rate": 1.6521616114504945e-06, "loss": 0.4349, "step": 13296 }, { "epoch": 2.46, "learning_rate": 1.6510620251581245e-06, "loss": 0.412, "step": 13297 }, { "epoch": 2.46, "learning_rate": 1.6499627719729228e-06, "loss": 0.433, "step": 13298 }, { "epoch": 2.46, "learning_rate": 1.6488638519387478e-06, "loss": 0.4235, "step": 13299 }, { "epoch": 2.46, "learning_rate": 1.6477652650994413e-06, "loss": 0.4317, "step": 13300 }, { "epoch": 2.46, "learning_rate": 1.6466670114988392e-06, "loss": 0.409, "step": 13301 }, { "epoch": 2.46, "learning_rate": 1.6455690911807553e-06, "loss": 0.4167, "step": 13302 }, { "epoch": 2.46, "learning_rate": 1.6444715041889992e-06, "loss": 0.389, "step": 13303 }, { "epoch": 2.46, "learning_rate": 1.6433742505673577e-06, "loss": 0.4225, "step": 13304 }, { "epoch": 2.46, "learning_rate": 1.642277330359614e-06, "loss": 0.4014, "step": 13305 }, { "epoch": 2.46, "learning_rate": 1.6411807436095306e-06, "loss": 0.4084, "step": 13306 }, { "epoch": 2.46, "learning_rate": 1.640084490360858e-06, "loss": 0.4229, "step": 13307 }, { "epoch": 2.46, "learning_rate": 1.6389885706573384e-06, "loss": 0.4379, "step": 13308 }, { "epoch": 2.46, "learning_rate": 1.6378929845426917e-06, "loss": 0.4086, "step": 13309 }, { "epoch": 2.46, "learning_rate": 1.6367977320606355e-06, "loss": 0.4188, "step": 13310 }, { "epoch": 2.46, "learning_rate": 1.635702813254867e-06, "loss": 0.4009, "step": 13311 }, { "epoch": 2.46, "learning_rate": 1.6346082281690667e-06, "loss": 0.4424, "step": 13312 }, { "epoch": 2.46, "learning_rate": 1.6335139768469122e-06, "loss": 0.3975, "step": 13313 }, { "epoch": 2.46, "learning_rate": 1.6324200593320584e-06, "loss": 0.4161, "step": 13314 }, { "epoch": 2.46, "learning_rate": 1.6313264756681535e-06, "loss": 0.4027, "step": 13315 }, { "epoch": 2.46, "learning_rate": 1.6302332258988263e-06, "loss": 0.4071, "step": 13316 }, { "epoch": 2.46, "learning_rate": 1.6291403100676984e-06, "loss": 0.4267, "step": 13317 }, { "epoch": 2.46, "learning_rate": 1.6280477282183725e-06, "loss": 0.4032, "step": 13318 }, { "epoch": 2.46, "learning_rate": 1.6269554803944443e-06, "loss": 0.4062, "step": 13319 }, { "epoch": 2.46, "learning_rate": 1.6258635666394884e-06, "loss": 0.41, "step": 13320 }, { "epoch": 2.46, "learning_rate": 1.6247719869970735e-06, "loss": 0.4096, "step": 13321 }, { "epoch": 2.46, "learning_rate": 1.623680741510747e-06, "loss": 0.4023, "step": 13322 }, { "epoch": 2.46, "learning_rate": 1.6225898302240539e-06, "loss": 0.4067, "step": 13323 }, { "epoch": 2.47, "learning_rate": 1.621499253180514e-06, "loss": 0.4279, "step": 13324 }, { "epoch": 2.47, "learning_rate": 1.6204090104236436e-06, "loss": 0.4252, "step": 13325 }, { "epoch": 2.47, "learning_rate": 1.6193191019969369e-06, "loss": 0.4111, "step": 13326 }, { "epoch": 2.47, "learning_rate": 1.6182295279438843e-06, "loss": 0.4289, "step": 13327 }, { "epoch": 2.47, "learning_rate": 1.6171402883079545e-06, "loss": 0.4421, "step": 13328 }, { "epoch": 2.47, "learning_rate": 1.616051383132604e-06, "loss": 0.3894, "step": 13329 }, { "epoch": 2.47, "learning_rate": 1.6149628124612838e-06, "loss": 0.4138, "step": 13330 }, { "epoch": 2.47, "learning_rate": 1.6138745763374209e-06, "loss": 0.4251, "step": 13331 }, { "epoch": 2.47, "learning_rate": 1.6127866748044373e-06, "loss": 0.4046, "step": 13332 }, { "epoch": 2.47, "learning_rate": 1.6116991079057376e-06, "loss": 0.3815, "step": 13333 }, { "epoch": 2.47, "learning_rate": 1.610611875684711e-06, "loss": 0.4117, "step": 13334 }, { "epoch": 2.47, "learning_rate": 1.60952497818474e-06, "loss": 0.4265, "step": 13335 }, { "epoch": 2.47, "learning_rate": 1.608438415449185e-06, "loss": 0.4047, "step": 13336 }, { "epoch": 2.47, "learning_rate": 1.6073521875214038e-06, "loss": 0.4171, "step": 13337 }, { "epoch": 2.47, "learning_rate": 1.6062662944447305e-06, "loss": 0.419, "step": 13338 }, { "epoch": 2.47, "learning_rate": 1.6051807362624905e-06, "loss": 0.4101, "step": 13339 }, { "epoch": 2.47, "learning_rate": 1.6040955130179981e-06, "loss": 0.4202, "step": 13340 }, { "epoch": 2.47, "learning_rate": 1.6030106247545475e-06, "loss": 0.4026, "step": 13341 }, { "epoch": 2.47, "learning_rate": 1.6019260715154294e-06, "loss": 0.4356, "step": 13342 }, { "epoch": 2.47, "learning_rate": 1.6008418533439118e-06, "loss": 0.423, "step": 13343 }, { "epoch": 2.47, "learning_rate": 1.5997579702832522e-06, "loss": 0.4116, "step": 13344 }, { "epoch": 2.47, "learning_rate": 1.5986744223766993e-06, "loss": 0.4256, "step": 13345 }, { "epoch": 2.47, "learning_rate": 1.5975912096674784e-06, "loss": 0.407, "step": 13346 }, { "epoch": 2.47, "learning_rate": 1.596508332198815e-06, "loss": 0.429, "step": 13347 }, { "epoch": 2.47, "learning_rate": 1.595425790013908e-06, "loss": 0.4159, "step": 13348 }, { "epoch": 2.47, "learning_rate": 1.594343583155954e-06, "loss": 0.4173, "step": 13349 }, { "epoch": 2.47, "learning_rate": 1.5932617116681281e-06, "loss": 0.4308, "step": 13350 }, { "epoch": 2.47, "learning_rate": 1.5921801755935928e-06, "loss": 0.425, "step": 13351 }, { "epoch": 2.47, "learning_rate": 1.5910989749755045e-06, "loss": 0.4156, "step": 13352 }, { "epoch": 2.47, "learning_rate": 1.5900181098569968e-06, "loss": 0.4061, "step": 13353 }, { "epoch": 2.47, "learning_rate": 1.5889375802811968e-06, "loss": 0.4138, "step": 13354 }, { "epoch": 2.47, "learning_rate": 1.587857386291215e-06, "loss": 0.4261, "step": 13355 }, { "epoch": 2.47, "learning_rate": 1.5867775279301467e-06, "loss": 0.4033, "step": 13356 }, { "epoch": 2.47, "learning_rate": 1.5856980052410808e-06, "loss": 0.4103, "step": 13357 }, { "epoch": 2.47, "learning_rate": 1.584618818267083e-06, "loss": 0.395, "step": 13358 }, { "epoch": 2.47, "learning_rate": 1.5835399670512165e-06, "loss": 0.4213, "step": 13359 }, { "epoch": 2.47, "learning_rate": 1.5824614516365234e-06, "loss": 0.4034, "step": 13360 }, { "epoch": 2.47, "learning_rate": 1.5813832720660293e-06, "loss": 0.4164, "step": 13361 }, { "epoch": 2.47, "learning_rate": 1.5803054283827601e-06, "loss": 0.4364, "step": 13362 }, { "epoch": 2.47, "learning_rate": 1.5792279206297124e-06, "loss": 0.4102, "step": 13363 }, { "epoch": 2.47, "learning_rate": 1.5781507488498837e-06, "loss": 0.4252, "step": 13364 }, { "epoch": 2.47, "learning_rate": 1.5770739130862434e-06, "loss": 0.4102, "step": 13365 }, { "epoch": 2.47, "learning_rate": 1.5759974133817625e-06, "loss": 0.4126, "step": 13366 }, { "epoch": 2.47, "learning_rate": 1.5749212497793864e-06, "loss": 0.433, "step": 13367 }, { "epoch": 2.47, "learning_rate": 1.5738454223220556e-06, "loss": 0.4168, "step": 13368 }, { "epoch": 2.47, "learning_rate": 1.572769931052689e-06, "loss": 0.4223, "step": 13369 }, { "epoch": 2.47, "learning_rate": 1.571694776014202e-06, "loss": 0.4328, "step": 13370 }, { "epoch": 2.47, "learning_rate": 1.5706199572494873e-06, "loss": 0.4101, "step": 13371 }, { "epoch": 2.47, "learning_rate": 1.5695454748014316e-06, "loss": 0.4011, "step": 13372 }, { "epoch": 2.47, "learning_rate": 1.5684713287129005e-06, "loss": 0.3938, "step": 13373 }, { "epoch": 2.47, "learning_rate": 1.5673975190267555e-06, "loss": 0.3962, "step": 13374 }, { "epoch": 2.47, "learning_rate": 1.5663240457858342e-06, "loss": 0.4174, "step": 13375 }, { "epoch": 2.47, "learning_rate": 1.5652509090329716e-06, "loss": 0.4079, "step": 13376 }, { "epoch": 2.47, "learning_rate": 1.5641781088109809e-06, "loss": 0.4093, "step": 13377 }, { "epoch": 2.48, "learning_rate": 1.5631056451626625e-06, "loss": 0.427, "step": 13378 }, { "epoch": 2.48, "learning_rate": 1.562033518130811e-06, "loss": 0.4057, "step": 13379 }, { "epoch": 2.48, "learning_rate": 1.560961727758198e-06, "loss": 0.3969, "step": 13380 }, { "epoch": 2.48, "learning_rate": 1.5598902740875887e-06, "loss": 0.4337, "step": 13381 }, { "epoch": 2.48, "learning_rate": 1.5588191571617318e-06, "loss": 0.4057, "step": 13382 }, { "epoch": 2.48, "learning_rate": 1.5577483770233603e-06, "loss": 0.41, "step": 13383 }, { "epoch": 2.48, "learning_rate": 1.5566779337151994e-06, "loss": 0.4067, "step": 13384 }, { "epoch": 2.48, "learning_rate": 1.5556078272799547e-06, "loss": 0.4081, "step": 13385 }, { "epoch": 2.48, "learning_rate": 1.5545380577603253e-06, "loss": 0.4111, "step": 13386 }, { "epoch": 2.48, "learning_rate": 1.5534686251989916e-06, "loss": 0.4287, "step": 13387 }, { "epoch": 2.48, "learning_rate": 1.5523995296386184e-06, "loss": 0.4174, "step": 13388 }, { "epoch": 2.48, "learning_rate": 1.5513307711218673e-06, "loss": 0.3886, "step": 13389 }, { "epoch": 2.48, "learning_rate": 1.5502623496913728e-06, "loss": 0.4106, "step": 13390 }, { "epoch": 2.48, "learning_rate": 1.5491942653897685e-06, "loss": 0.4207, "step": 13391 }, { "epoch": 2.48, "learning_rate": 1.548126518259665e-06, "loss": 0.404, "step": 13392 }, { "epoch": 2.48, "learning_rate": 1.547059108343667e-06, "loss": 0.3985, "step": 13393 }, { "epoch": 2.48, "learning_rate": 1.5459920356843606e-06, "loss": 0.4083, "step": 13394 }, { "epoch": 2.48, "learning_rate": 1.544925300324317e-06, "loss": 0.4307, "step": 13395 }, { "epoch": 2.48, "learning_rate": 1.5438589023061024e-06, "loss": 0.4251, "step": 13396 }, { "epoch": 2.48, "learning_rate": 1.5427928416722594e-06, "loss": 0.4226, "step": 13397 }, { "epoch": 2.48, "learning_rate": 1.541727118465326e-06, "loss": 0.4211, "step": 13398 }, { "epoch": 2.48, "learning_rate": 1.5406617327278207e-06, "loss": 0.4365, "step": 13399 }, { "epoch": 2.48, "learning_rate": 1.539596684502248e-06, "loss": 0.4069, "step": 13400 }, { "epoch": 2.48, "learning_rate": 1.5385319738311056e-06, "loss": 0.4089, "step": 13401 }, { "epoch": 2.48, "learning_rate": 1.537467600756869e-06, "loss": 0.4087, "step": 13402 }, { "epoch": 2.48, "learning_rate": 1.5364035653220099e-06, "loss": 0.4038, "step": 13403 }, { "epoch": 2.48, "learning_rate": 1.535339867568978e-06, "loss": 0.4221, "step": 13404 }, { "epoch": 2.48, "learning_rate": 1.534276507540212e-06, "loss": 0.4066, "step": 13405 }, { "epoch": 2.48, "learning_rate": 1.5332134852781412e-06, "loss": 0.4164, "step": 13406 }, { "epoch": 2.48, "learning_rate": 1.532150800825174e-06, "loss": 0.4046, "step": 13407 }, { "epoch": 2.48, "learning_rate": 1.5310884542237148e-06, "loss": 0.4344, "step": 13408 }, { "epoch": 2.48, "learning_rate": 1.5300264455161462e-06, "loss": 0.4284, "step": 13409 }, { "epoch": 2.48, "learning_rate": 1.5289647747448389e-06, "loss": 0.4111, "step": 13410 }, { "epoch": 2.48, "learning_rate": 1.5279034419521554e-06, "loss": 0.4099, "step": 13411 }, { "epoch": 2.48, "learning_rate": 1.5268424471804367e-06, "loss": 0.4125, "step": 13412 }, { "epoch": 2.48, "learning_rate": 1.5257817904720185e-06, "loss": 0.4002, "step": 13413 }, { "epoch": 2.48, "learning_rate": 1.524721471869216e-06, "loss": 0.4309, "step": 13414 }, { "epoch": 2.48, "learning_rate": 1.5236614914143366e-06, "loss": 0.4074, "step": 13415 }, { "epoch": 2.48, "learning_rate": 1.5226018491496685e-06, "loss": 0.4242, "step": 13416 }, { "epoch": 2.48, "learning_rate": 1.5215425451174926e-06, "loss": 0.4046, "step": 13417 }, { "epoch": 2.48, "learning_rate": 1.5204835793600702e-06, "loss": 0.4265, "step": 13418 }, { "epoch": 2.48, "learning_rate": 1.5194249519196559e-06, "loss": 0.4197, "step": 13419 }, { "epoch": 2.48, "learning_rate": 1.5183666628384819e-06, "loss": 0.4241, "step": 13420 }, { "epoch": 2.48, "learning_rate": 1.517308712158777e-06, "loss": 0.4191, "step": 13421 }, { "epoch": 2.48, "learning_rate": 1.5162510999227464e-06, "loss": 0.4233, "step": 13422 }, { "epoch": 2.48, "learning_rate": 1.5151938261725929e-06, "loss": 0.4051, "step": 13423 }, { "epoch": 2.48, "learning_rate": 1.5141368909504938e-06, "loss": 0.4266, "step": 13424 }, { "epoch": 2.48, "learning_rate": 1.5130802942986245e-06, "loss": 0.4169, "step": 13425 }, { "epoch": 2.48, "learning_rate": 1.5120240362591377e-06, "loss": 0.3835, "step": 13426 }, { "epoch": 2.48, "learning_rate": 1.5109681168741742e-06, "loss": 0.4448, "step": 13427 }, { "epoch": 2.48, "learning_rate": 1.509912536185869e-06, "loss": 0.417, "step": 13428 }, { "epoch": 2.48, "learning_rate": 1.5088572942363323e-06, "loss": 0.4248, "step": 13429 }, { "epoch": 2.48, "learning_rate": 1.5078023910676698e-06, "loss": 0.3997, "step": 13430 }, { "epoch": 2.48, "learning_rate": 1.5067478267219704e-06, "loss": 0.4177, "step": 13431 }, { "epoch": 2.49, "learning_rate": 1.5056936012413049e-06, "loss": 0.4036, "step": 13432 }, { "epoch": 2.49, "learning_rate": 1.5046397146677394e-06, "loss": 0.4232, "step": 13433 }, { "epoch": 2.49, "learning_rate": 1.5035861670433194e-06, "loss": 0.4164, "step": 13434 }, { "epoch": 2.49, "learning_rate": 1.5025329584100822e-06, "loss": 0.4162, "step": 13435 }, { "epoch": 2.49, "learning_rate": 1.5014800888100457e-06, "loss": 0.4032, "step": 13436 }, { "epoch": 2.49, "learning_rate": 1.5004275582852213e-06, "loss": 0.4004, "step": 13437 }, { "epoch": 2.49, "learning_rate": 1.4993753668776013e-06, "loss": 0.416, "step": 13438 }, { "epoch": 2.49, "learning_rate": 1.498323514629162e-06, "loss": 0.4003, "step": 13439 }, { "epoch": 2.49, "learning_rate": 1.4972720015818776e-06, "loss": 0.4282, "step": 13440 }, { "epoch": 2.49, "learning_rate": 1.4962208277776946e-06, "loss": 0.4108, "step": 13441 }, { "epoch": 2.49, "learning_rate": 1.4951699932585595e-06, "loss": 0.4192, "step": 13442 }, { "epoch": 2.49, "learning_rate": 1.4941194980663943e-06, "loss": 0.4107, "step": 13443 }, { "epoch": 2.49, "learning_rate": 1.4930693422431109e-06, "loss": 0.4254, "step": 13444 }, { "epoch": 2.49, "learning_rate": 1.4920195258306137e-06, "loss": 0.4078, "step": 13445 }, { "epoch": 2.49, "learning_rate": 1.4909700488707822e-06, "loss": 0.4143, "step": 13446 }, { "epoch": 2.49, "learning_rate": 1.4899209114054946e-06, "loss": 0.4108, "step": 13447 }, { "epoch": 2.49, "learning_rate": 1.488872113476606e-06, "loss": 0.4221, "step": 13448 }, { "epoch": 2.49, "learning_rate": 1.4878236551259607e-06, "loss": 0.4142, "step": 13449 }, { "epoch": 2.49, "learning_rate": 1.486775536395393e-06, "loss": 0.4078, "step": 13450 }, { "epoch": 2.49, "learning_rate": 1.4857277573267182e-06, "loss": 0.4046, "step": 13451 }, { "epoch": 2.49, "learning_rate": 1.484680317961744e-06, "loss": 0.4241, "step": 13452 }, { "epoch": 2.49, "learning_rate": 1.4836332183422596e-06, "loss": 0.4206, "step": 13453 }, { "epoch": 2.49, "learning_rate": 1.4825864585100392e-06, "loss": 0.4098, "step": 13454 }, { "epoch": 2.49, "learning_rate": 1.4815400385068523e-06, "loss": 0.4039, "step": 13455 }, { "epoch": 2.49, "learning_rate": 1.4804939583744438e-06, "loss": 0.431, "step": 13456 }, { "epoch": 2.49, "learning_rate": 1.4794482181545555e-06, "loss": 0.4115, "step": 13457 }, { "epoch": 2.49, "learning_rate": 1.4784028178889054e-06, "loss": 0.4227, "step": 13458 }, { "epoch": 2.49, "learning_rate": 1.4773577576192088e-06, "loss": 0.4225, "step": 13459 }, { "epoch": 2.49, "learning_rate": 1.476313037387157e-06, "loss": 0.4224, "step": 13460 }, { "epoch": 2.49, "learning_rate": 1.475268657234432e-06, "loss": 0.412, "step": 13461 }, { "epoch": 2.49, "learning_rate": 1.4742246172027075e-06, "loss": 0.4192, "step": 13462 }, { "epoch": 2.49, "learning_rate": 1.4731809173336332e-06, "loss": 0.431, "step": 13463 }, { "epoch": 2.49, "learning_rate": 1.4721375576688545e-06, "loss": 0.4192, "step": 13464 }, { "epoch": 2.49, "learning_rate": 1.4710945382499974e-06, "loss": 0.4201, "step": 13465 }, { "epoch": 2.49, "learning_rate": 1.4700518591186785e-06, "loss": 0.4003, "step": 13466 }, { "epoch": 2.49, "learning_rate": 1.4690095203164967e-06, "loss": 0.421, "step": 13467 }, { "epoch": 2.49, "learning_rate": 1.4679675218850408e-06, "loss": 0.4193, "step": 13468 }, { "epoch": 2.49, "learning_rate": 1.4669258638658834e-06, "loss": 0.4055, "step": 13469 }, { "epoch": 2.49, "learning_rate": 1.4658845463005877e-06, "loss": 0.4151, "step": 13470 }, { "epoch": 2.49, "learning_rate": 1.464843569230695e-06, "loss": 0.4186, "step": 13471 }, { "epoch": 2.49, "learning_rate": 1.4638029326977444e-06, "loss": 0.4095, "step": 13472 }, { "epoch": 2.49, "learning_rate": 1.462762636743249e-06, "loss": 0.4027, "step": 13473 }, { "epoch": 2.49, "learning_rate": 1.4617226814087215e-06, "loss": 0.4125, "step": 13474 }, { "epoch": 2.49, "learning_rate": 1.460683066735651e-06, "loss": 0.4071, "step": 13475 }, { "epoch": 2.49, "learning_rate": 1.4596437927655128e-06, "loss": 0.4012, "step": 13476 }, { "epoch": 2.49, "learning_rate": 1.4586048595397784e-06, "loss": 0.4082, "step": 13477 }, { "epoch": 2.49, "learning_rate": 1.4575662670998935e-06, "loss": 0.4128, "step": 13478 }, { "epoch": 2.49, "learning_rate": 1.4565280154873006e-06, "loss": 0.3928, "step": 13479 }, { "epoch": 2.49, "learning_rate": 1.45549010474342e-06, "loss": 0.4033, "step": 13480 }, { "epoch": 2.49, "learning_rate": 1.4544525349096672e-06, "loss": 0.4287, "step": 13481 }, { "epoch": 2.49, "learning_rate": 1.4534153060274358e-06, "loss": 0.3914, "step": 13482 }, { "epoch": 2.49, "learning_rate": 1.4523784181381084e-06, "loss": 0.4163, "step": 13483 }, { "epoch": 2.49, "learning_rate": 1.4513418712830584e-06, "loss": 0.403, "step": 13484 }, { "epoch": 2.49, "learning_rate": 1.4503056655036384e-06, "loss": 0.4299, "step": 13485 }, { "epoch": 2.5, "learning_rate": 1.4492698008411954e-06, "loss": 0.4203, "step": 13486 }, { "epoch": 2.5, "learning_rate": 1.4482342773370561e-06, "loss": 0.4045, "step": 13487 }, { "epoch": 2.5, "learning_rate": 1.4471990950325342e-06, "loss": 0.3952, "step": 13488 }, { "epoch": 2.5, "learning_rate": 1.4461642539689346e-06, "loss": 0.4145, "step": 13489 }, { "epoch": 2.5, "learning_rate": 1.445129754187542e-06, "loss": 0.4215, "step": 13490 }, { "epoch": 2.5, "learning_rate": 1.4440955957296366e-06, "loss": 0.4295, "step": 13491 }, { "epoch": 2.5, "learning_rate": 1.4430617786364754e-06, "loss": 0.431, "step": 13492 }, { "epoch": 2.5, "learning_rate": 1.4420283029493042e-06, "loss": 0.4203, "step": 13493 }, { "epoch": 2.5, "learning_rate": 1.4409951687093616e-06, "loss": 0.4311, "step": 13494 }, { "epoch": 2.5, "learning_rate": 1.4399623759578619e-06, "loss": 0.422, "step": 13495 }, { "epoch": 2.5, "learning_rate": 1.4389299247360179e-06, "loss": 0.4276, "step": 13496 }, { "epoch": 2.5, "learning_rate": 1.4378978150850197e-06, "loss": 0.43, "step": 13497 }, { "epoch": 2.5, "learning_rate": 1.4368660470460438e-06, "loss": 0.3991, "step": 13498 }, { "epoch": 2.5, "learning_rate": 1.4358346206602614e-06, "loss": 0.4073, "step": 13499 }, { "epoch": 2.5, "learning_rate": 1.4348035359688183e-06, "loss": 0.393, "step": 13500 }, { "epoch": 2.5, "learning_rate": 1.4337727930128586e-06, "loss": 0.4121, "step": 13501 }, { "epoch": 2.5, "learning_rate": 1.4327423918335026e-06, "loss": 0.4206, "step": 13502 }, { "epoch": 2.5, "learning_rate": 1.4317123324718652e-06, "loss": 0.4282, "step": 13503 }, { "epoch": 2.5, "learning_rate": 1.4306826149690423e-06, "loss": 0.4296, "step": 13504 }, { "epoch": 2.5, "learning_rate": 1.4296532393661145e-06, "loss": 0.3856, "step": 13505 }, { "epoch": 2.5, "learning_rate": 1.4286242057041578e-06, "loss": 0.3977, "step": 13506 }, { "epoch": 2.5, "learning_rate": 1.4275955140242238e-06, "loss": 0.4194, "step": 13507 }, { "epoch": 2.5, "learning_rate": 1.4265671643673583e-06, "loss": 0.4155, "step": 13508 }, { "epoch": 2.5, "learning_rate": 1.4255391567745914e-06, "loss": 0.4209, "step": 13509 }, { "epoch": 2.5, "learning_rate": 1.424511491286933e-06, "loss": 0.4149, "step": 13510 }, { "epoch": 2.5, "learning_rate": 1.4234841679453926e-06, "loss": 0.4102, "step": 13511 }, { "epoch": 2.5, "learning_rate": 1.422457186790952e-06, "loss": 0.4267, "step": 13512 }, { "epoch": 2.5, "learning_rate": 1.4214305478645907e-06, "loss": 0.4237, "step": 13513 }, { "epoch": 2.5, "learning_rate": 1.420404251207267e-06, "loss": 0.4199, "step": 13514 }, { "epoch": 2.5, "learning_rate": 1.419378296859929e-06, "loss": 0.4191, "step": 13515 }, { "epoch": 2.5, "learning_rate": 1.4183526848635098e-06, "loss": 0.3937, "step": 13516 }, { "epoch": 2.5, "learning_rate": 1.4173274152589322e-06, "loss": 0.4009, "step": 13517 }, { "epoch": 2.5, "learning_rate": 1.4163024880870968e-06, "loss": 0.4129, "step": 13518 }, { "epoch": 2.5, "learning_rate": 1.4152779033889031e-06, "loss": 0.4161, "step": 13519 }, { "epoch": 2.5, "learning_rate": 1.414253661205225e-06, "loss": 0.4259, "step": 13520 }, { "epoch": 2.5, "learning_rate": 1.4132297615769308e-06, "loss": 0.4026, "step": 13521 }, { "epoch": 2.5, "learning_rate": 1.4122062045448693e-06, "loss": 0.4251, "step": 13522 }, { "epoch": 2.5, "learning_rate": 1.411182990149883e-06, "loss": 0.4263, "step": 13523 }, { "epoch": 2.5, "learning_rate": 1.4101601184327907e-06, "loss": 0.4093, "step": 13524 }, { "epoch": 2.5, "learning_rate": 1.4091375894344094e-06, "loss": 0.4213, "step": 13525 }, { "epoch": 2.5, "learning_rate": 1.4081154031955314e-06, "loss": 0.403, "step": 13526 }, { "epoch": 2.5, "learning_rate": 1.4070935597569403e-06, "loss": 0.4239, "step": 13527 }, { "epoch": 2.5, "learning_rate": 1.406072059159408e-06, "loss": 0.4049, "step": 13528 }, { "epoch": 2.5, "learning_rate": 1.4050509014436875e-06, "loss": 0.4044, "step": 13529 }, { "epoch": 2.5, "learning_rate": 1.4040300866505252e-06, "loss": 0.4222, "step": 13530 }, { "epoch": 2.5, "learning_rate": 1.4030096148206473e-06, "loss": 0.4241, "step": 13531 }, { "epoch": 2.5, "learning_rate": 1.4019894859947669e-06, "loss": 0.3955, "step": 13532 }, { "epoch": 2.5, "learning_rate": 1.400969700213589e-06, "loss": 0.4009, "step": 13533 }, { "epoch": 2.5, "learning_rate": 1.399950257517798e-06, "loss": 0.4147, "step": 13534 }, { "epoch": 2.5, "learning_rate": 1.3989311579480701e-06, "loss": 0.4134, "step": 13535 }, { "epoch": 2.5, "learning_rate": 1.3979124015450663e-06, "loss": 0.4144, "step": 13536 }, { "epoch": 2.5, "learning_rate": 1.3968939883494281e-06, "loss": 0.4113, "step": 13537 }, { "epoch": 2.5, "learning_rate": 1.3958759184017934e-06, "loss": 0.4114, "step": 13538 }, { "epoch": 2.5, "learning_rate": 1.3948581917427772e-06, "loss": 0.4304, "step": 13539 }, { "epoch": 2.51, "learning_rate": 1.3938408084129907e-06, "loss": 0.4207, "step": 13540 }, { "epoch": 2.51, "learning_rate": 1.392823768453021e-06, "loss": 0.4204, "step": 13541 }, { "epoch": 2.51, "learning_rate": 1.3918070719034448e-06, "loss": 0.417, "step": 13542 }, { "epoch": 2.51, "learning_rate": 1.3907907188048309e-06, "loss": 0.4197, "step": 13543 }, { "epoch": 2.51, "learning_rate": 1.3897747091977266e-06, "loss": 0.4058, "step": 13544 }, { "epoch": 2.51, "learning_rate": 1.3887590431226717e-06, "loss": 0.4234, "step": 13545 }, { "epoch": 2.51, "learning_rate": 1.3877437206201849e-06, "loss": 0.4077, "step": 13546 }, { "epoch": 2.51, "learning_rate": 1.3867287417307806e-06, "loss": 0.4183, "step": 13547 }, { "epoch": 2.51, "learning_rate": 1.3857141064949532e-06, "loss": 0.4213, "step": 13548 }, { "epoch": 2.51, "learning_rate": 1.384699814953182e-06, "loss": 0.4119, "step": 13549 }, { "epoch": 2.51, "learning_rate": 1.3836858671459385e-06, "loss": 0.4201, "step": 13550 }, { "epoch": 2.51, "learning_rate": 1.3826722631136758e-06, "loss": 0.3822, "step": 13551 }, { "epoch": 2.51, "learning_rate": 1.3816590028968357e-06, "loss": 0.415, "step": 13552 }, { "epoch": 2.51, "learning_rate": 1.3806460865358462e-06, "loss": 0.3987, "step": 13553 }, { "epoch": 2.51, "learning_rate": 1.379633514071116e-06, "loss": 0.4084, "step": 13554 }, { "epoch": 2.51, "learning_rate": 1.3786212855430515e-06, "loss": 0.4179, "step": 13555 }, { "epoch": 2.51, "learning_rate": 1.3776094009920337e-06, "loss": 0.4117, "step": 13556 }, { "epoch": 2.51, "learning_rate": 1.3765978604584385e-06, "loss": 0.4154, "step": 13557 }, { "epoch": 2.51, "learning_rate": 1.3755866639826232e-06, "loss": 0.4214, "step": 13558 }, { "epoch": 2.51, "learning_rate": 1.3745758116049301e-06, "loss": 0.4328, "step": 13559 }, { "epoch": 2.51, "learning_rate": 1.373565303365695e-06, "loss": 0.4103, "step": 13560 }, { "epoch": 2.51, "learning_rate": 1.3725551393052294e-06, "loss": 0.4503, "step": 13561 }, { "epoch": 2.51, "learning_rate": 1.371545319463844e-06, "loss": 0.408, "step": 13562 }, { "epoch": 2.51, "learning_rate": 1.370535843881825e-06, "loss": 0.4103, "step": 13563 }, { "epoch": 2.51, "learning_rate": 1.369526712599446e-06, "loss": 0.3991, "step": 13564 }, { "epoch": 2.51, "learning_rate": 1.3685179256569747e-06, "loss": 0.4204, "step": 13565 }, { "epoch": 2.51, "learning_rate": 1.3675094830946555e-06, "loss": 0.4137, "step": 13566 }, { "epoch": 2.51, "learning_rate": 1.3665013849527275e-06, "loss": 0.3817, "step": 13567 }, { "epoch": 2.51, "learning_rate": 1.3654936312714073e-06, "loss": 0.421, "step": 13568 }, { "epoch": 2.51, "learning_rate": 1.3644862220909072e-06, "loss": 0.4301, "step": 13569 }, { "epoch": 2.51, "learning_rate": 1.363479157451416e-06, "loss": 0.3874, "step": 13570 }, { "epoch": 2.51, "learning_rate": 1.3624724373931187e-06, "loss": 0.4031, "step": 13571 }, { "epoch": 2.51, "learning_rate": 1.361466061956177e-06, "loss": 0.4078, "step": 13572 }, { "epoch": 2.51, "learning_rate": 1.360460031180748e-06, "loss": 0.4249, "step": 13573 }, { "epoch": 2.51, "learning_rate": 1.3594543451069664e-06, "loss": 0.3999, "step": 13574 }, { "epoch": 2.51, "learning_rate": 1.358449003774961e-06, "loss": 0.4262, "step": 13575 }, { "epoch": 2.51, "learning_rate": 1.3574440072248375e-06, "loss": 0.4132, "step": 13576 }, { "epoch": 2.51, "learning_rate": 1.3564393554967003e-06, "loss": 0.4185, "step": 13577 }, { "epoch": 2.51, "learning_rate": 1.3554350486306267e-06, "loss": 0.4135, "step": 13578 }, { "epoch": 2.51, "learning_rate": 1.354431086666692e-06, "loss": 0.4142, "step": 13579 }, { "epoch": 2.51, "learning_rate": 1.35342746964495e-06, "loss": 0.4024, "step": 13580 }, { "epoch": 2.51, "learning_rate": 1.352424197605442e-06, "loss": 0.4033, "step": 13581 }, { "epoch": 2.51, "learning_rate": 1.3514212705881991e-06, "loss": 0.4055, "step": 13582 }, { "epoch": 2.51, "learning_rate": 1.3504186886332338e-06, "loss": 0.4259, "step": 13583 }, { "epoch": 2.51, "learning_rate": 1.3494164517805498e-06, "loss": 0.4239, "step": 13584 }, { "epoch": 2.51, "learning_rate": 1.3484145600701337e-06, "loss": 0.4069, "step": 13585 }, { "epoch": 2.51, "learning_rate": 1.3474130135419561e-06, "loss": 0.3906, "step": 13586 }, { "epoch": 2.51, "learning_rate": 1.3464118122359825e-06, "loss": 0.415, "step": 13587 }, { "epoch": 2.51, "learning_rate": 1.3454109561921524e-06, "loss": 0.4266, "step": 13588 }, { "epoch": 2.51, "learning_rate": 1.3444104454504048e-06, "loss": 0.4155, "step": 13589 }, { "epoch": 2.51, "learning_rate": 1.3434102800506531e-06, "loss": 0.429, "step": 13590 }, { "epoch": 2.51, "learning_rate": 1.3424104600328059e-06, "loss": 0.3893, "step": 13591 }, { "epoch": 2.51, "learning_rate": 1.341410985436752e-06, "loss": 0.4101, "step": 13592 }, { "epoch": 2.51, "learning_rate": 1.3404118563023661e-06, "loss": 0.4224, "step": 13593 }, { "epoch": 2.52, "learning_rate": 1.3394130726695175e-06, "loss": 0.3997, "step": 13594 }, { "epoch": 2.52, "learning_rate": 1.3384146345780501e-06, "loss": 0.3944, "step": 13595 }, { "epoch": 2.52, "learning_rate": 1.3374165420678043e-06, "loss": 0.4092, "step": 13596 }, { "epoch": 2.52, "learning_rate": 1.3364187951786e-06, "loss": 0.4066, "step": 13597 }, { "epoch": 2.52, "learning_rate": 1.3354213939502436e-06, "loss": 0.4128, "step": 13598 }, { "epoch": 2.52, "learning_rate": 1.3344243384225342e-06, "loss": 0.4303, "step": 13599 }, { "epoch": 2.52, "learning_rate": 1.3334276286352466e-06, "loss": 0.4311, "step": 13600 }, { "epoch": 2.52, "learning_rate": 1.3324312646281533e-06, "loss": 0.4225, "step": 13601 }, { "epoch": 2.52, "learning_rate": 1.3314352464410063e-06, "loss": 0.3899, "step": 13602 }, { "epoch": 2.52, "learning_rate": 1.33043957411354e-06, "loss": 0.4164, "step": 13603 }, { "epoch": 2.52, "learning_rate": 1.3294442476854862e-06, "loss": 0.4061, "step": 13604 }, { "epoch": 2.52, "learning_rate": 1.328449267196551e-06, "loss": 0.4142, "step": 13605 }, { "epoch": 2.52, "learning_rate": 1.327454632686438e-06, "loss": 0.427, "step": 13606 }, { "epoch": 2.52, "learning_rate": 1.3264603441948276e-06, "loss": 0.4175, "step": 13607 }, { "epoch": 2.52, "learning_rate": 1.3254664017613895e-06, "loss": 0.4132, "step": 13608 }, { "epoch": 2.52, "learning_rate": 1.3244728054257839e-06, "loss": 0.4122, "step": 13609 }, { "epoch": 2.52, "learning_rate": 1.3234795552276481e-06, "loss": 0.4379, "step": 13610 }, { "epoch": 2.52, "learning_rate": 1.322486651206616e-06, "loss": 0.4211, "step": 13611 }, { "epoch": 2.52, "learning_rate": 1.3214940934023002e-06, "loss": 0.4242, "step": 13612 }, { "epoch": 2.52, "learning_rate": 1.3205018818543014e-06, "loss": 0.4046, "step": 13613 }, { "epoch": 2.52, "learning_rate": 1.319510016602209e-06, "loss": 0.4196, "step": 13614 }, { "epoch": 2.52, "learning_rate": 1.3185184976855936e-06, "loss": 0.4163, "step": 13615 }, { "epoch": 2.52, "learning_rate": 1.3175273251440191e-06, "loss": 0.4369, "step": 13616 }, { "epoch": 2.52, "learning_rate": 1.316536499017026e-06, "loss": 0.4325, "step": 13617 }, { "epoch": 2.52, "learning_rate": 1.3155460193441528e-06, "loss": 0.3988, "step": 13618 }, { "epoch": 2.52, "learning_rate": 1.3145558861649122e-06, "loss": 0.4121, "step": 13619 }, { "epoch": 2.52, "learning_rate": 1.3135660995188138e-06, "loss": 0.4234, "step": 13620 }, { "epoch": 2.52, "learning_rate": 1.3125766594453427e-06, "loss": 0.4282, "step": 13621 }, { "epoch": 2.52, "learning_rate": 1.3115875659839806e-06, "loss": 0.4035, "step": 13622 }, { "epoch": 2.52, "learning_rate": 1.3105988191741858e-06, "loss": 0.4207, "step": 13623 }, { "epoch": 2.52, "learning_rate": 1.3096104190554137e-06, "loss": 0.4386, "step": 13624 }, { "epoch": 2.52, "learning_rate": 1.3086223656670926e-06, "loss": 0.3951, "step": 13625 }, { "epoch": 2.52, "learning_rate": 1.30763465904865e-06, "loss": 0.4226, "step": 13626 }, { "epoch": 2.52, "learning_rate": 1.3066472992394895e-06, "loss": 0.4095, "step": 13627 }, { "epoch": 2.52, "learning_rate": 1.305660286279008e-06, "loss": 0.427, "step": 13628 }, { "epoch": 2.52, "learning_rate": 1.3046736202065846e-06, "loss": 0.4175, "step": 13629 }, { "epoch": 2.52, "learning_rate": 1.3036873010615813e-06, "loss": 0.4236, "step": 13630 }, { "epoch": 2.52, "learning_rate": 1.3027013288833567e-06, "loss": 0.4311, "step": 13631 }, { "epoch": 2.52, "learning_rate": 1.301715703711245e-06, "loss": 0.425, "step": 13632 }, { "epoch": 2.52, "learning_rate": 1.3007304255845743e-06, "loss": 0.4096, "step": 13633 }, { "epoch": 2.52, "learning_rate": 1.2997454945426524e-06, "loss": 0.3901, "step": 13634 }, { "epoch": 2.52, "learning_rate": 1.2987609106247756e-06, "loss": 0.4111, "step": 13635 }, { "epoch": 2.52, "learning_rate": 1.2977766738702303e-06, "loss": 0.4238, "step": 13636 }, { "epoch": 2.52, "learning_rate": 1.2967927843182827e-06, "loss": 0.4282, "step": 13637 }, { "epoch": 2.52, "learning_rate": 1.2958092420081915e-06, "loss": 0.4007, "step": 13638 }, { "epoch": 2.52, "learning_rate": 1.2948260469791929e-06, "loss": 0.4345, "step": 13639 }, { "epoch": 2.52, "learning_rate": 1.2938431992705202e-06, "loss": 0.4372, "step": 13640 }, { "epoch": 2.52, "learning_rate": 1.2928606989213854e-06, "loss": 0.403, "step": 13641 }, { "epoch": 2.52, "learning_rate": 1.291878545970986e-06, "loss": 0.4206, "step": 13642 }, { "epoch": 2.52, "learning_rate": 1.2908967404585115e-06, "loss": 0.4057, "step": 13643 }, { "epoch": 2.52, "learning_rate": 1.289915282423131e-06, "loss": 0.4036, "step": 13644 }, { "epoch": 2.52, "learning_rate": 1.2889341719040061e-06, "loss": 0.4185, "step": 13645 }, { "epoch": 2.52, "learning_rate": 1.28795340894028e-06, "loss": 0.421, "step": 13646 }, { "epoch": 2.52, "learning_rate": 1.2869729935710807e-06, "loss": 0.3976, "step": 13647 }, { "epoch": 2.53, "learning_rate": 1.2859929258355287e-06, "loss": 0.4107, "step": 13648 }, { "epoch": 2.53, "learning_rate": 1.2850132057727237e-06, "loss": 0.4181, "step": 13649 }, { "epoch": 2.53, "learning_rate": 1.2840338334217594e-06, "loss": 0.4079, "step": 13650 }, { "epoch": 2.53, "learning_rate": 1.2830548088217065e-06, "loss": 0.4212, "step": 13651 }, { "epoch": 2.53, "learning_rate": 1.282076132011627e-06, "loss": 0.4176, "step": 13652 }, { "epoch": 2.53, "learning_rate": 1.28109780303057e-06, "loss": 0.4131, "step": 13653 }, { "epoch": 2.53, "learning_rate": 1.280119821917567e-06, "loss": 0.3879, "step": 13654 }, { "epoch": 2.53, "learning_rate": 1.2791421887116395e-06, "loss": 0.4098, "step": 13655 }, { "epoch": 2.53, "learning_rate": 1.278164903451793e-06, "loss": 0.4101, "step": 13656 }, { "epoch": 2.53, "learning_rate": 1.277187966177017e-06, "loss": 0.4027, "step": 13657 }, { "epoch": 2.53, "learning_rate": 1.276211376926293e-06, "loss": 0.4124, "step": 13658 }, { "epoch": 2.53, "learning_rate": 1.2752351357385818e-06, "loss": 0.4221, "step": 13659 }, { "epoch": 2.53, "learning_rate": 1.2742592426528377e-06, "loss": 0.3812, "step": 13660 }, { "epoch": 2.53, "learning_rate": 1.273283697707991e-06, "loss": 0.4223, "step": 13661 }, { "epoch": 2.53, "learning_rate": 1.2723085009429702e-06, "loss": 0.3989, "step": 13662 }, { "epoch": 2.53, "learning_rate": 1.2713336523966824e-06, "loss": 0.4132, "step": 13663 }, { "epoch": 2.53, "learning_rate": 1.2703591521080183e-06, "loss": 0.3943, "step": 13664 }, { "epoch": 2.53, "learning_rate": 1.2693850001158636e-06, "loss": 0.4096, "step": 13665 }, { "epoch": 2.53, "learning_rate": 1.2684111964590806e-06, "loss": 0.4273, "step": 13666 }, { "epoch": 2.53, "learning_rate": 1.2674377411765282e-06, "loss": 0.4215, "step": 13667 }, { "epoch": 2.53, "learning_rate": 1.2664646343070385e-06, "loss": 0.4303, "step": 13668 }, { "epoch": 2.53, "learning_rate": 1.265491875889443e-06, "loss": 0.4146, "step": 13669 }, { "epoch": 2.53, "learning_rate": 1.2645194659625482e-06, "loss": 0.4203, "step": 13670 }, { "epoch": 2.53, "learning_rate": 1.2635474045651553e-06, "loss": 0.4231, "step": 13671 }, { "epoch": 2.53, "learning_rate": 1.2625756917360433e-06, "loss": 0.4203, "step": 13672 }, { "epoch": 2.53, "learning_rate": 1.2616043275139866e-06, "loss": 0.4061, "step": 13673 }, { "epoch": 2.53, "learning_rate": 1.2606333119377367e-06, "loss": 0.4097, "step": 13674 }, { "epoch": 2.53, "learning_rate": 1.259662645046039e-06, "loss": 0.4095, "step": 13675 }, { "epoch": 2.53, "learning_rate": 1.2586923268776174e-06, "loss": 0.4056, "step": 13676 }, { "epoch": 2.53, "learning_rate": 1.2577223574711893e-06, "loss": 0.4181, "step": 13677 }, { "epoch": 2.53, "learning_rate": 1.2567527368654543e-06, "loss": 0.4096, "step": 13678 }, { "epoch": 2.53, "learning_rate": 1.2557834650990952e-06, "loss": 0.4452, "step": 13679 }, { "epoch": 2.53, "learning_rate": 1.2548145422107882e-06, "loss": 0.417, "step": 13680 }, { "epoch": 2.53, "learning_rate": 1.253845968239188e-06, "loss": 0.3973, "step": 13681 }, { "epoch": 2.53, "learning_rate": 1.2528777432229422e-06, "loss": 0.4189, "step": 13682 }, { "epoch": 2.53, "learning_rate": 1.2519098672006769e-06, "loss": 0.4237, "step": 13683 }, { "epoch": 2.53, "learning_rate": 1.2509423402110144e-06, "loss": 0.4294, "step": 13684 }, { "epoch": 2.53, "learning_rate": 1.2499751622925537e-06, "loss": 0.4249, "step": 13685 }, { "epoch": 2.53, "learning_rate": 1.249008333483881e-06, "loss": 0.4036, "step": 13686 }, { "epoch": 2.53, "learning_rate": 1.2480418538235772e-06, "loss": 0.4205, "step": 13687 }, { "epoch": 2.53, "learning_rate": 1.2470757233501963e-06, "loss": 0.4104, "step": 13688 }, { "epoch": 2.53, "learning_rate": 1.2461099421022916e-06, "loss": 0.4087, "step": 13689 }, { "epoch": 2.53, "learning_rate": 1.2451445101183924e-06, "loss": 0.4078, "step": 13690 }, { "epoch": 2.53, "learning_rate": 1.2441794274370155e-06, "loss": 0.4198, "step": 13691 }, { "epoch": 2.53, "learning_rate": 1.2432146940966706e-06, "loss": 0.4165, "step": 13692 }, { "epoch": 2.53, "learning_rate": 1.2422503101358451e-06, "loss": 0.3991, "step": 13693 }, { "epoch": 2.53, "learning_rate": 1.24128627559302e-06, "loss": 0.4425, "step": 13694 }, { "epoch": 2.53, "learning_rate": 1.240322590506655e-06, "loss": 0.4301, "step": 13695 }, { "epoch": 2.53, "learning_rate": 1.2393592549152e-06, "loss": 0.437, "step": 13696 }, { "epoch": 2.53, "learning_rate": 1.2383962688570916e-06, "loss": 0.4152, "step": 13697 }, { "epoch": 2.53, "learning_rate": 1.237433632370749e-06, "loss": 0.4102, "step": 13698 }, { "epoch": 2.53, "learning_rate": 1.2364713454945832e-06, "loss": 0.4246, "step": 13699 }, { "epoch": 2.53, "learning_rate": 1.2355094082669849e-06, "loss": 0.392, "step": 13700 }, { "epoch": 2.53, "learning_rate": 1.2345478207263316e-06, "loss": 0.4071, "step": 13701 }, { "epoch": 2.54, "learning_rate": 1.233586582910995e-06, "loss": 0.3949, "step": 13702 }, { "epoch": 2.54, "learning_rate": 1.2326256948593207e-06, "loss": 0.4169, "step": 13703 }, { "epoch": 2.54, "learning_rate": 1.2316651566096505e-06, "loss": 0.4019, "step": 13704 }, { "epoch": 2.54, "learning_rate": 1.2307049682003035e-06, "loss": 0.4358, "step": 13705 }, { "epoch": 2.54, "learning_rate": 1.2297451296695962e-06, "loss": 0.4192, "step": 13706 }, { "epoch": 2.54, "learning_rate": 1.2287856410558196e-06, "loss": 0.3974, "step": 13707 }, { "epoch": 2.54, "learning_rate": 1.2278265023972546e-06, "loss": 0.4263, "step": 13708 }, { "epoch": 2.54, "learning_rate": 1.2268677137321727e-06, "loss": 0.4116, "step": 13709 }, { "epoch": 2.54, "learning_rate": 1.2259092750988232e-06, "loss": 0.4061, "step": 13710 }, { "epoch": 2.54, "learning_rate": 1.2249511865354524e-06, "loss": 0.4029, "step": 13711 }, { "epoch": 2.54, "learning_rate": 1.2239934480802818e-06, "loss": 0.4191, "step": 13712 }, { "epoch": 2.54, "learning_rate": 1.223036059771523e-06, "loss": 0.4366, "step": 13713 }, { "epoch": 2.54, "learning_rate": 1.2220790216473766e-06, "loss": 0.4052, "step": 13714 }, { "epoch": 2.54, "learning_rate": 1.2211223337460233e-06, "loss": 0.4178, "step": 13715 }, { "epoch": 2.54, "learning_rate": 1.2201659961056378e-06, "loss": 0.4052, "step": 13716 }, { "epoch": 2.54, "learning_rate": 1.219210008764371e-06, "loss": 0.3955, "step": 13717 }, { "epoch": 2.54, "learning_rate": 1.21825437176037e-06, "loss": 0.4415, "step": 13718 }, { "epoch": 2.54, "learning_rate": 1.2172990851317578e-06, "loss": 0.4174, "step": 13719 }, { "epoch": 2.54, "learning_rate": 1.216344148916655e-06, "loss": 0.4033, "step": 13720 }, { "epoch": 2.54, "learning_rate": 1.2153895631531554e-06, "loss": 0.4101, "step": 13721 }, { "epoch": 2.54, "learning_rate": 1.2144353278793497e-06, "loss": 0.4027, "step": 13722 }, { "epoch": 2.54, "learning_rate": 1.2134814431333065e-06, "loss": 0.435, "step": 13723 }, { "epoch": 2.54, "learning_rate": 1.2125279089530872e-06, "loss": 0.4215, "step": 13724 }, { "epoch": 2.54, "learning_rate": 1.211574725376734e-06, "loss": 0.4016, "step": 13725 }, { "epoch": 2.54, "learning_rate": 1.2106218924422796e-06, "loss": 0.4191, "step": 13726 }, { "epoch": 2.54, "learning_rate": 1.209669410187736e-06, "loss": 0.4156, "step": 13727 }, { "epoch": 2.54, "learning_rate": 1.2087172786511104e-06, "loss": 0.4187, "step": 13728 }, { "epoch": 2.54, "learning_rate": 1.207765497870389e-06, "loss": 0.4096, "step": 13729 }, { "epoch": 2.54, "learning_rate": 1.2068140678835438e-06, "loss": 0.4305, "step": 13730 }, { "epoch": 2.54, "learning_rate": 1.205862988728539e-06, "loss": 0.4223, "step": 13731 }, { "epoch": 2.54, "learning_rate": 1.2049122604433162e-06, "loss": 0.4357, "step": 13732 }, { "epoch": 2.54, "learning_rate": 1.203961883065814e-06, "loss": 0.4087, "step": 13733 }, { "epoch": 2.54, "learning_rate": 1.2030118566339465e-06, "loss": 0.4323, "step": 13734 }, { "epoch": 2.54, "learning_rate": 1.202062181185617e-06, "loss": 0.4259, "step": 13735 }, { "epoch": 2.54, "learning_rate": 1.2011128567587195e-06, "loss": 0.419, "step": 13736 }, { "epoch": 2.54, "learning_rate": 1.2001638833911256e-06, "loss": 0.4068, "step": 13737 }, { "epoch": 2.54, "learning_rate": 1.1992152611207031e-06, "loss": 0.4322, "step": 13738 }, { "epoch": 2.54, "learning_rate": 1.1982669899852971e-06, "loss": 0.4115, "step": 13739 }, { "epoch": 2.54, "learning_rate": 1.19731907002274e-06, "loss": 0.3906, "step": 13740 }, { "epoch": 2.54, "learning_rate": 1.1963715012708565e-06, "loss": 0.4332, "step": 13741 }, { "epoch": 2.54, "learning_rate": 1.195424283767449e-06, "loss": 0.4118, "step": 13742 }, { "epoch": 2.54, "learning_rate": 1.1944774175503138e-06, "loss": 0.4062, "step": 13743 }, { "epoch": 2.54, "learning_rate": 1.193530902657225e-06, "loss": 0.4134, "step": 13744 }, { "epoch": 2.54, "learning_rate": 1.1925847391259481e-06, "loss": 0.428, "step": 13745 }, { "epoch": 2.54, "learning_rate": 1.191638926994234e-06, "loss": 0.4119, "step": 13746 }, { "epoch": 2.54, "learning_rate": 1.1906934662998182e-06, "loss": 0.407, "step": 13747 }, { "epoch": 2.54, "learning_rate": 1.1897483570804237e-06, "loss": 0.4128, "step": 13748 }, { "epoch": 2.54, "learning_rate": 1.1888035993737569e-06, "loss": 0.4409, "step": 13749 }, { "epoch": 2.54, "learning_rate": 1.1878591932175142e-06, "loss": 0.4129, "step": 13750 }, { "epoch": 2.54, "learning_rate": 1.186915138649375e-06, "loss": 0.4114, "step": 13751 }, { "epoch": 2.54, "learning_rate": 1.185971435707003e-06, "loss": 0.415, "step": 13752 }, { "epoch": 2.54, "learning_rate": 1.1850280844280537e-06, "loss": 0.4168, "step": 13753 }, { "epoch": 2.54, "learning_rate": 1.1840850848501605e-06, "loss": 0.41, "step": 13754 }, { "epoch": 2.54, "learning_rate": 1.1831424370109535e-06, "loss": 0.4141, "step": 13755 }, { "epoch": 2.55, "learning_rate": 1.1822001409480388e-06, "loss": 0.424, "step": 13756 }, { "epoch": 2.55, "learning_rate": 1.1812581966990112e-06, "loss": 0.4162, "step": 13757 }, { "epoch": 2.55, "learning_rate": 1.1803166043014546e-06, "loss": 0.3962, "step": 13758 }, { "epoch": 2.55, "learning_rate": 1.1793753637929361e-06, "loss": 0.4005, "step": 13759 }, { "epoch": 2.55, "learning_rate": 1.17843447521101e-06, "loss": 0.4137, "step": 13760 }, { "epoch": 2.55, "learning_rate": 1.1774939385932172e-06, "loss": 0.4103, "step": 13761 }, { "epoch": 2.55, "learning_rate": 1.176553753977079e-06, "loss": 0.4179, "step": 13762 }, { "epoch": 2.55, "learning_rate": 1.1756139214001117e-06, "loss": 0.4345, "step": 13763 }, { "epoch": 2.55, "learning_rate": 1.174674440899809e-06, "loss": 0.4148, "step": 13764 }, { "epoch": 2.55, "learning_rate": 1.1737353125136586e-06, "loss": 0.4067, "step": 13765 }, { "epoch": 2.55, "learning_rate": 1.172796536279126e-06, "loss": 0.3815, "step": 13766 }, { "epoch": 2.55, "learning_rate": 1.1718581122336704e-06, "loss": 0.4233, "step": 13767 }, { "epoch": 2.55, "learning_rate": 1.170920040414729e-06, "loss": 0.405, "step": 13768 }, { "epoch": 2.55, "learning_rate": 1.1699823208597338e-06, "loss": 0.4217, "step": 13769 }, { "epoch": 2.55, "learning_rate": 1.1690449536060932e-06, "loss": 0.402, "step": 13770 }, { "epoch": 2.55, "learning_rate": 1.168107938691212e-06, "loss": 0.4142, "step": 13771 }, { "epoch": 2.55, "learning_rate": 1.167171276152469e-06, "loss": 0.4045, "step": 13772 }, { "epoch": 2.55, "learning_rate": 1.166234966027241e-06, "loss": 0.3996, "step": 13773 }, { "epoch": 2.55, "learning_rate": 1.1652990083528804e-06, "loss": 0.4212, "step": 13774 }, { "epoch": 2.55, "learning_rate": 1.164363403166735e-06, "loss": 0.4179, "step": 13775 }, { "epoch": 2.55, "learning_rate": 1.1634281505061284e-06, "loss": 0.4064, "step": 13776 }, { "epoch": 2.55, "learning_rate": 1.1624932504083797e-06, "loss": 0.4089, "step": 13777 }, { "epoch": 2.55, "learning_rate": 1.1615587029107888e-06, "loss": 0.4267, "step": 13778 }, { "epoch": 2.55, "learning_rate": 1.1606245080506396e-06, "loss": 0.4115, "step": 13779 }, { "epoch": 2.55, "learning_rate": 1.1596906658652086e-06, "loss": 0.4208, "step": 13780 }, { "epoch": 2.55, "learning_rate": 1.1587571763917505e-06, "loss": 0.4101, "step": 13781 }, { "epoch": 2.55, "learning_rate": 1.1578240396675145e-06, "loss": 0.4136, "step": 13782 }, { "epoch": 2.55, "learning_rate": 1.1568912557297284e-06, "loss": 0.3922, "step": 13783 }, { "epoch": 2.55, "learning_rate": 1.1559588246156061e-06, "loss": 0.3937, "step": 13784 }, { "epoch": 2.55, "learning_rate": 1.1550267463623554e-06, "loss": 0.4197, "step": 13785 }, { "epoch": 2.55, "learning_rate": 1.1540950210071588e-06, "loss": 0.4224, "step": 13786 }, { "epoch": 2.55, "learning_rate": 1.1531636485871955e-06, "loss": 0.4269, "step": 13787 }, { "epoch": 2.55, "learning_rate": 1.1522326291396224e-06, "loss": 0.4251, "step": 13788 }, { "epoch": 2.55, "learning_rate": 1.1513019627015843e-06, "loss": 0.4052, "step": 13789 }, { "epoch": 2.55, "learning_rate": 1.150371649310218e-06, "loss": 0.4122, "step": 13790 }, { "epoch": 2.55, "learning_rate": 1.149441689002635e-06, "loss": 0.4319, "step": 13791 }, { "epoch": 2.55, "learning_rate": 1.1485120818159445e-06, "loss": 0.4369, "step": 13792 }, { "epoch": 2.55, "learning_rate": 1.1475828277872325e-06, "loss": 0.4088, "step": 13793 }, { "epoch": 2.55, "learning_rate": 1.1466539269535771e-06, "loss": 0.4072, "step": 13794 }, { "epoch": 2.55, "learning_rate": 1.1457253793520385e-06, "loss": 0.4265, "step": 13795 }, { "epoch": 2.55, "learning_rate": 1.1447971850196627e-06, "loss": 0.4089, "step": 13796 }, { "epoch": 2.55, "learning_rate": 1.1438693439934856e-06, "loss": 0.4206, "step": 13797 }, { "epoch": 2.55, "learning_rate": 1.1429418563105232e-06, "loss": 0.3988, "step": 13798 }, { "epoch": 2.55, "learning_rate": 1.142014722007785e-06, "loss": 0.4135, "step": 13799 }, { "epoch": 2.55, "learning_rate": 1.1410879411222586e-06, "loss": 0.4043, "step": 13800 }, { "epoch": 2.55, "learning_rate": 1.1401615136909194e-06, "loss": 0.4158, "step": 13801 }, { "epoch": 2.55, "learning_rate": 1.1392354397507344e-06, "loss": 0.4178, "step": 13802 }, { "epoch": 2.55, "learning_rate": 1.1383097193386484e-06, "loss": 0.4025, "step": 13803 }, { "epoch": 2.55, "learning_rate": 1.1373843524915983e-06, "loss": 0.4328, "step": 13804 }, { "epoch": 2.55, "learning_rate": 1.136459339246505e-06, "loss": 0.3911, "step": 13805 }, { "epoch": 2.55, "learning_rate": 1.1355346796402723e-06, "loss": 0.3767, "step": 13806 }, { "epoch": 2.55, "learning_rate": 1.1346103737097947e-06, "loss": 0.4092, "step": 13807 }, { "epoch": 2.55, "learning_rate": 1.1336864214919474e-06, "loss": 0.4301, "step": 13808 }, { "epoch": 2.55, "learning_rate": 1.1327628230235987e-06, "loss": 0.4161, "step": 13809 }, { "epoch": 2.56, "learning_rate": 1.1318395783415958e-06, "loss": 0.4236, "step": 13810 }, { "epoch": 2.56, "learning_rate": 1.1309166874827727e-06, "loss": 0.412, "step": 13811 }, { "epoch": 2.56, "learning_rate": 1.1299941504839552e-06, "loss": 0.4133, "step": 13812 }, { "epoch": 2.56, "learning_rate": 1.1290719673819472e-06, "loss": 0.4015, "step": 13813 }, { "epoch": 2.56, "learning_rate": 1.128150138213545e-06, "loss": 0.4128, "step": 13814 }, { "epoch": 2.56, "learning_rate": 1.127228663015525e-06, "loss": 0.4253, "step": 13815 }, { "epoch": 2.56, "learning_rate": 1.126307541824656e-06, "loss": 0.4228, "step": 13816 }, { "epoch": 2.56, "learning_rate": 1.1253867746776837e-06, "loss": 0.4009, "step": 13817 }, { "epoch": 2.56, "learning_rate": 1.1244663616113516e-06, "loss": 0.4254, "step": 13818 }, { "epoch": 2.56, "learning_rate": 1.1235463026623761e-06, "loss": 0.4087, "step": 13819 }, { "epoch": 2.56, "learning_rate": 1.122626597867471e-06, "loss": 0.4204, "step": 13820 }, { "epoch": 2.56, "learning_rate": 1.1217072472633272e-06, "loss": 0.4006, "step": 13821 }, { "epoch": 2.56, "learning_rate": 1.1207882508866274e-06, "loss": 0.4027, "step": 13822 }, { "epoch": 2.56, "learning_rate": 1.1198696087740358e-06, "loss": 0.4426, "step": 13823 }, { "epoch": 2.56, "learning_rate": 1.1189513209622072e-06, "loss": 0.4199, "step": 13824 }, { "epoch": 2.56, "learning_rate": 1.1180333874877769e-06, "loss": 0.4189, "step": 13825 }, { "epoch": 2.56, "learning_rate": 1.1171158083873713e-06, "loss": 0.4253, "step": 13826 }, { "epoch": 2.56, "learning_rate": 1.1161985836975986e-06, "loss": 0.4275, "step": 13827 }, { "epoch": 2.56, "learning_rate": 1.1152817134550532e-06, "loss": 0.4397, "step": 13828 }, { "epoch": 2.56, "learning_rate": 1.1143651976963188e-06, "loss": 0.394, "step": 13829 }, { "epoch": 2.56, "learning_rate": 1.1134490364579609e-06, "loss": 0.4257, "step": 13830 }, { "epoch": 2.56, "learning_rate": 1.1125332297765345e-06, "loss": 0.4008, "step": 13831 }, { "epoch": 2.56, "learning_rate": 1.1116177776885773e-06, "loss": 0.4059, "step": 13832 }, { "epoch": 2.56, "learning_rate": 1.1107026802306132e-06, "loss": 0.4017, "step": 13833 }, { "epoch": 2.56, "learning_rate": 1.1097879374391562e-06, "loss": 0.4236, "step": 13834 }, { "epoch": 2.56, "learning_rate": 1.1088735493506974e-06, "loss": 0.418, "step": 13835 }, { "epoch": 2.56, "learning_rate": 1.1079595160017253e-06, "loss": 0.4296, "step": 13836 }, { "epoch": 2.56, "learning_rate": 1.107045837428704e-06, "loss": 0.4116, "step": 13837 }, { "epoch": 2.56, "learning_rate": 1.10613251366809e-06, "loss": 0.4182, "step": 13838 }, { "epoch": 2.56, "learning_rate": 1.105219544756323e-06, "loss": 0.4272, "step": 13839 }, { "epoch": 2.56, "learning_rate": 1.1043069307298249e-06, "loss": 0.4203, "step": 13840 }, { "epoch": 2.56, "learning_rate": 1.1033946716250133e-06, "loss": 0.4142, "step": 13841 }, { "epoch": 2.56, "learning_rate": 1.10248276747828e-06, "loss": 0.4131, "step": 13842 }, { "epoch": 2.56, "learning_rate": 1.101571218326013e-06, "loss": 0.4379, "step": 13843 }, { "epoch": 2.56, "learning_rate": 1.1006600242045796e-06, "loss": 0.4136, "step": 13844 }, { "epoch": 2.56, "learning_rate": 1.0997491851503317e-06, "loss": 0.4141, "step": 13845 }, { "epoch": 2.56, "learning_rate": 1.098838701199616e-06, "loss": 0.4223, "step": 13846 }, { "epoch": 2.56, "learning_rate": 1.0979285723887534e-06, "loss": 0.4312, "step": 13847 }, { "epoch": 2.56, "learning_rate": 1.0970187987540614e-06, "loss": 0.406, "step": 13848 }, { "epoch": 2.56, "learning_rate": 1.0961093803318357e-06, "loss": 0.4157, "step": 13849 }, { "epoch": 2.56, "learning_rate": 1.0952003171583593e-06, "loss": 0.4088, "step": 13850 }, { "epoch": 2.56, "learning_rate": 1.0942916092699051e-06, "loss": 0.4081, "step": 13851 }, { "epoch": 2.56, "learning_rate": 1.0933832567027248e-06, "loss": 0.4238, "step": 13852 }, { "epoch": 2.56, "learning_rate": 1.0924752594930643e-06, "loss": 0.421, "step": 13853 }, { "epoch": 2.56, "learning_rate": 1.0915676176771495e-06, "loss": 0.4019, "step": 13854 }, { "epoch": 2.56, "learning_rate": 1.0906603312911913e-06, "loss": 0.4304, "step": 13855 }, { "epoch": 2.56, "learning_rate": 1.0897534003713927e-06, "loss": 0.4069, "step": 13856 }, { "epoch": 2.56, "learning_rate": 1.088846824953934e-06, "loss": 0.4016, "step": 13857 }, { "epoch": 2.56, "learning_rate": 1.0879406050749908e-06, "loss": 0.4211, "step": 13858 }, { "epoch": 2.56, "learning_rate": 1.087034740770716e-06, "loss": 0.4057, "step": 13859 }, { "epoch": 2.56, "learning_rate": 1.0861292320772543e-06, "loss": 0.4144, "step": 13860 }, { "epoch": 2.56, "learning_rate": 1.0852240790307323e-06, "loss": 0.3904, "step": 13861 }, { "epoch": 2.56, "learning_rate": 1.0843192816672632e-06, "loss": 0.4284, "step": 13862 }, { "epoch": 2.56, "learning_rate": 1.0834148400229484e-06, "loss": 0.4241, "step": 13863 }, { "epoch": 2.57, "learning_rate": 1.082510754133872e-06, "loss": 0.4226, "step": 13864 }, { "epoch": 2.57, "learning_rate": 1.0816070240361075e-06, "loss": 0.3953, "step": 13865 }, { "epoch": 2.57, "learning_rate": 1.080703649765712e-06, "loss": 0.3916, "step": 13866 }, { "epoch": 2.57, "learning_rate": 1.0798006313587238e-06, "loss": 0.3979, "step": 13867 }, { "epoch": 2.57, "learning_rate": 1.0788979688511781e-06, "loss": 0.4121, "step": 13868 }, { "epoch": 2.57, "learning_rate": 1.0779956622790845e-06, "loss": 0.397, "step": 13869 }, { "epoch": 2.57, "learning_rate": 1.0770937116784475e-06, "loss": 0.4037, "step": 13870 }, { "epoch": 2.57, "learning_rate": 1.0761921170852484e-06, "loss": 0.4117, "step": 13871 }, { "epoch": 2.57, "learning_rate": 1.0752908785354632e-06, "loss": 0.4075, "step": 13872 }, { "epoch": 2.57, "learning_rate": 1.0743899960650472e-06, "loss": 0.4206, "step": 13873 }, { "epoch": 2.57, "learning_rate": 1.0734894697099474e-06, "loss": 0.4006, "step": 13874 }, { "epoch": 2.57, "learning_rate": 1.0725892995060882e-06, "loss": 0.4295, "step": 13875 }, { "epoch": 2.57, "learning_rate": 1.0716894854893889e-06, "loss": 0.4201, "step": 13876 }, { "epoch": 2.57, "learning_rate": 1.0707900276957473e-06, "loss": 0.4164, "step": 13877 }, { "epoch": 2.57, "learning_rate": 1.0698909261610536e-06, "loss": 0.4301, "step": 13878 }, { "epoch": 2.57, "learning_rate": 1.0689921809211768e-06, "loss": 0.406, "step": 13879 }, { "epoch": 2.57, "learning_rate": 1.0680937920119782e-06, "loss": 0.4065, "step": 13880 }, { "epoch": 2.57, "learning_rate": 1.0671957594692983e-06, "loss": 0.4246, "step": 13881 }, { "epoch": 2.57, "learning_rate": 1.0662980833289704e-06, "loss": 0.4198, "step": 13882 }, { "epoch": 2.57, "learning_rate": 1.0654007636268094e-06, "loss": 0.4196, "step": 13883 }, { "epoch": 2.57, "learning_rate": 1.064503800398614e-06, "loss": 0.4189, "step": 13884 }, { "epoch": 2.57, "learning_rate": 1.063607193680175e-06, "loss": 0.4174, "step": 13885 }, { "epoch": 2.57, "learning_rate": 1.0627109435072613e-06, "loss": 0.4119, "step": 13886 }, { "epoch": 2.57, "learning_rate": 1.0618150499156365e-06, "loss": 0.416, "step": 13887 }, { "epoch": 2.57, "learning_rate": 1.060919512941042e-06, "loss": 0.4017, "step": 13888 }, { "epoch": 2.57, "learning_rate": 1.0600243326192073e-06, "loss": 0.3957, "step": 13889 }, { "epoch": 2.57, "learning_rate": 1.0591295089858522e-06, "loss": 0.4141, "step": 13890 }, { "epoch": 2.57, "learning_rate": 1.058235042076674e-06, "loss": 0.4028, "step": 13891 }, { "epoch": 2.57, "learning_rate": 1.0573409319273632e-06, "loss": 0.4329, "step": 13892 }, { "epoch": 2.57, "learning_rate": 1.056447178573593e-06, "loss": 0.4068, "step": 13893 }, { "epoch": 2.57, "learning_rate": 1.055553782051021e-06, "loss": 0.4175, "step": 13894 }, { "epoch": 2.57, "learning_rate": 1.0546607423952937e-06, "loss": 0.4229, "step": 13895 }, { "epoch": 2.57, "learning_rate": 1.0537680596420385e-06, "loss": 0.4222, "step": 13896 }, { "epoch": 2.57, "learning_rate": 1.0528757338268768e-06, "loss": 0.4165, "step": 13897 }, { "epoch": 2.57, "learning_rate": 1.051983764985408e-06, "loss": 0.4229, "step": 13898 }, { "epoch": 2.57, "learning_rate": 1.0510921531532192e-06, "loss": 0.4295, "step": 13899 }, { "epoch": 2.57, "learning_rate": 1.0502008983658852e-06, "loss": 0.4199, "step": 13900 }, { "epoch": 2.57, "learning_rate": 1.049310000658965e-06, "loss": 0.4056, "step": 13901 }, { "epoch": 2.57, "learning_rate": 1.0484194600680054e-06, "loss": 0.4157, "step": 13902 }, { "epoch": 2.57, "learning_rate": 1.0475292766285328e-06, "loss": 0.3921, "step": 13903 }, { "epoch": 2.57, "learning_rate": 1.0466394503760702e-06, "loss": 0.4247, "step": 13904 }, { "epoch": 2.57, "learning_rate": 1.0457499813461169e-06, "loss": 0.4059, "step": 13905 }, { "epoch": 2.57, "learning_rate": 1.044860869574158e-06, "loss": 0.4196, "step": 13906 }, { "epoch": 2.57, "learning_rate": 1.043972115095674e-06, "loss": 0.4123, "step": 13907 }, { "epoch": 2.57, "learning_rate": 1.0430837179461173e-06, "loss": 0.4271, "step": 13908 }, { "epoch": 2.57, "learning_rate": 1.04219567816094e-06, "loss": 0.4132, "step": 13909 }, { "epoch": 2.57, "learning_rate": 1.04130799577557e-06, "loss": 0.4138, "step": 13910 }, { "epoch": 2.57, "learning_rate": 1.0404206708254216e-06, "loss": 0.4113, "step": 13911 }, { "epoch": 2.57, "learning_rate": 1.039533703345903e-06, "loss": 0.4001, "step": 13912 }, { "epoch": 2.57, "learning_rate": 1.038647093372398e-06, "loss": 0.4037, "step": 13913 }, { "epoch": 2.57, "learning_rate": 1.037760840940284e-06, "loss": 0.4001, "step": 13914 }, { "epoch": 2.57, "learning_rate": 1.0368749460849192e-06, "loss": 0.4307, "step": 13915 }, { "epoch": 2.57, "learning_rate": 1.0359894088416477e-06, "loss": 0.426, "step": 13916 }, { "epoch": 2.57, "learning_rate": 1.0351042292458048e-06, "loss": 0.4081, "step": 13917 }, { "epoch": 2.58, "learning_rate": 1.0342194073327016e-06, "loss": 0.4033, "step": 13918 }, { "epoch": 2.58, "learning_rate": 1.0333349431376483e-06, "loss": 0.4247, "step": 13919 }, { "epoch": 2.58, "learning_rate": 1.0324508366959263e-06, "loss": 0.4226, "step": 13920 }, { "epoch": 2.58, "learning_rate": 1.0315670880428142e-06, "loss": 0.4175, "step": 13921 }, { "epoch": 2.58, "learning_rate": 1.0306836972135702e-06, "loss": 0.4138, "step": 13922 }, { "epoch": 2.58, "learning_rate": 1.029800664243441e-06, "loss": 0.4054, "step": 13923 }, { "epoch": 2.58, "learning_rate": 1.028917989167656e-06, "loss": 0.4078, "step": 13924 }, { "epoch": 2.58, "learning_rate": 1.0280356720214358e-06, "loss": 0.4084, "step": 13925 }, { "epoch": 2.58, "learning_rate": 1.02715371283998e-06, "loss": 0.4214, "step": 13926 }, { "epoch": 2.58, "learning_rate": 1.0262721116584796e-06, "loss": 0.4177, "step": 13927 }, { "epoch": 2.58, "learning_rate": 1.025390868512105e-06, "loss": 0.4071, "step": 13928 }, { "epoch": 2.58, "learning_rate": 1.0245099834360206e-06, "loss": 0.4205, "step": 13929 }, { "epoch": 2.58, "learning_rate": 1.0236294564653692e-06, "loss": 0.4021, "step": 13930 }, { "epoch": 2.58, "learning_rate": 1.022749287635284e-06, "loss": 0.413, "step": 13931 }, { "epoch": 2.58, "learning_rate": 1.0218694769808823e-06, "loss": 0.418, "step": 13932 }, { "epoch": 2.58, "learning_rate": 1.020990024537264e-06, "loss": 0.425, "step": 13933 }, { "epoch": 2.58, "learning_rate": 1.0201109303395207e-06, "loss": 0.4321, "step": 13934 }, { "epoch": 2.58, "learning_rate": 1.0192321944227235e-06, "loss": 0.4188, "step": 13935 }, { "epoch": 2.58, "learning_rate": 1.0183538168219365e-06, "loss": 0.4114, "step": 13936 }, { "epoch": 2.58, "learning_rate": 1.0174757975722038e-06, "loss": 0.4237, "step": 13937 }, { "epoch": 2.58, "learning_rate": 1.0165981367085532e-06, "loss": 0.4255, "step": 13938 }, { "epoch": 2.58, "learning_rate": 1.0157208342660074e-06, "loss": 0.4256, "step": 13939 }, { "epoch": 2.58, "learning_rate": 1.0148438902795632e-06, "loss": 0.4177, "step": 13940 }, { "epoch": 2.58, "learning_rate": 1.0139673047842159e-06, "loss": 0.4102, "step": 13941 }, { "epoch": 2.58, "learning_rate": 1.0130910778149338e-06, "loss": 0.4169, "step": 13942 }, { "epoch": 2.58, "learning_rate": 1.0122152094066783e-06, "loss": 0.4159, "step": 13943 }, { "epoch": 2.58, "learning_rate": 1.011339699594398e-06, "loss": 0.4008, "step": 13944 }, { "epoch": 2.58, "learning_rate": 1.0104645484130182e-06, "loss": 0.4077, "step": 13945 }, { "epoch": 2.58, "learning_rate": 1.0095897558974622e-06, "loss": 0.4008, "step": 13946 }, { "epoch": 2.58, "learning_rate": 1.0087153220826296e-06, "loss": 0.4208, "step": 13947 }, { "epoch": 2.58, "learning_rate": 1.007841247003406e-06, "loss": 0.4193, "step": 13948 }, { "epoch": 2.58, "learning_rate": 1.0069675306946702e-06, "loss": 0.4096, "step": 13949 }, { "epoch": 2.58, "learning_rate": 1.0060941731912788e-06, "loss": 0.4377, "step": 13950 }, { "epoch": 2.58, "learning_rate": 1.0052211745280794e-06, "loss": 0.4046, "step": 13951 }, { "epoch": 2.58, "learning_rate": 1.0043485347398995e-06, "loss": 0.4038, "step": 13952 }, { "epoch": 2.58, "learning_rate": 1.0034762538615606e-06, "loss": 0.4268, "step": 13953 }, { "epoch": 2.58, "learning_rate": 1.0026043319278622e-06, "loss": 0.4073, "step": 13954 }, { "epoch": 2.58, "learning_rate": 1.0017327689735913e-06, "loss": 0.4106, "step": 13955 }, { "epoch": 2.58, "learning_rate": 1.0008615650335241e-06, "loss": 0.4332, "step": 13956 }, { "epoch": 2.58, "learning_rate": 9.999907201424175e-07, "loss": 0.4197, "step": 13957 }, { "epoch": 2.58, "learning_rate": 9.991202343350204e-07, "loss": 0.4013, "step": 13958 }, { "epoch": 2.58, "learning_rate": 9.982501076460604e-07, "loss": 0.4287, "step": 13959 }, { "epoch": 2.58, "learning_rate": 9.973803401102532e-07, "loss": 0.4165, "step": 13960 }, { "epoch": 2.58, "learning_rate": 9.965109317623045e-07, "loss": 0.3979, "step": 13961 }, { "epoch": 2.58, "learning_rate": 9.956418826368986e-07, "loss": 0.4216, "step": 13962 }, { "epoch": 2.58, "learning_rate": 9.947731927687122e-07, "loss": 0.4143, "step": 13963 }, { "epoch": 2.58, "learning_rate": 9.93904862192403e-07, "loss": 0.4206, "step": 13964 }, { "epoch": 2.58, "learning_rate": 9.930368909426124e-07, "loss": 0.4006, "step": 13965 }, { "epoch": 2.58, "learning_rate": 9.921692790539772e-07, "loss": 0.4037, "step": 13966 }, { "epoch": 2.58, "learning_rate": 9.913020265611073e-07, "loss": 0.4125, "step": 13967 }, { "epoch": 2.58, "learning_rate": 9.904351334986095e-07, "loss": 0.4171, "step": 13968 }, { "epoch": 2.58, "learning_rate": 9.895685999010674e-07, "loss": 0.4034, "step": 13969 }, { "epoch": 2.58, "learning_rate": 9.887024258030575e-07, "loss": 0.4041, "step": 13970 }, { "epoch": 2.58, "learning_rate": 9.878366112391358e-07, "loss": 0.3995, "step": 13971 }, { "epoch": 2.59, "learning_rate": 9.86971156243849e-07, "loss": 0.4112, "step": 13972 }, { "epoch": 2.59, "learning_rate": 9.861060608517237e-07, "loss": 0.411, "step": 13973 }, { "epoch": 2.59, "learning_rate": 9.852413250972792e-07, "loss": 0.4005, "step": 13974 }, { "epoch": 2.59, "learning_rate": 9.843769490150145e-07, "loss": 0.4079, "step": 13975 }, { "epoch": 2.59, "learning_rate": 9.8351293263942e-07, "loss": 0.4249, "step": 13976 }, { "epoch": 2.59, "learning_rate": 9.826492760049623e-07, "loss": 0.4122, "step": 13977 }, { "epoch": 2.59, "learning_rate": 9.81785979146106e-07, "loss": 0.4269, "step": 13978 }, { "epoch": 2.59, "learning_rate": 9.809230420972904e-07, "loss": 0.4175, "step": 13979 }, { "epoch": 2.59, "learning_rate": 9.8006046489295e-07, "loss": 0.4261, "step": 13980 }, { "epoch": 2.59, "learning_rate": 9.791982475674955e-07, "loss": 0.4228, "step": 13981 }, { "epoch": 2.59, "learning_rate": 9.783363901553288e-07, "loss": 0.4359, "step": 13982 }, { "epoch": 2.59, "learning_rate": 9.774748926908383e-07, "loss": 0.4093, "step": 13983 }, { "epoch": 2.59, "learning_rate": 9.76613755208392e-07, "loss": 0.4265, "step": 13984 }, { "epoch": 2.59, "learning_rate": 9.757529777423535e-07, "loss": 0.421, "step": 13985 }, { "epoch": 2.59, "learning_rate": 9.748925603270632e-07, "loss": 0.4196, "step": 13986 }, { "epoch": 2.59, "learning_rate": 9.740325029968477e-07, "loss": 0.4011, "step": 13987 }, { "epoch": 2.59, "learning_rate": 9.731728057860269e-07, "loss": 0.4134, "step": 13988 }, { "epoch": 2.59, "learning_rate": 9.72313468728896e-07, "loss": 0.4024, "step": 13989 }, { "epoch": 2.59, "learning_rate": 9.714544918597458e-07, "loss": 0.3968, "step": 13990 }, { "epoch": 2.59, "learning_rate": 9.705958752128442e-07, "loss": 0.3927, "step": 13991 }, { "epoch": 2.59, "learning_rate": 9.697376188224494e-07, "loss": 0.4216, "step": 13992 }, { "epoch": 2.59, "learning_rate": 9.688797227228053e-07, "loss": 0.4367, "step": 13993 }, { "epoch": 2.59, "learning_rate": 9.680221869481377e-07, "loss": 0.3952, "step": 13994 }, { "epoch": 2.59, "learning_rate": 9.671650115326648e-07, "loss": 0.424, "step": 13995 }, { "epoch": 2.59, "learning_rate": 9.663081965105824e-07, "loss": 0.4013, "step": 13996 }, { "epoch": 2.59, "learning_rate": 9.654517419160791e-07, "loss": 0.4146, "step": 13997 }, { "epoch": 2.59, "learning_rate": 9.64595647783325e-07, "loss": 0.4136, "step": 13998 }, { "epoch": 2.59, "learning_rate": 9.63739914146473e-07, "loss": 0.4054, "step": 13999 }, { "epoch": 2.59, "learning_rate": 9.628845410396704e-07, "loss": 0.3761, "step": 14000 }, { "epoch": 2.59, "learning_rate": 9.620295284970415e-07, "loss": 0.4025, "step": 14001 }, { "epoch": 2.59, "learning_rate": 9.61174876552703e-07, "loss": 0.4073, "step": 14002 }, { "epoch": 2.59, "learning_rate": 9.603205852407515e-07, "loss": 0.4124, "step": 14003 }, { "epoch": 2.59, "learning_rate": 9.594666545952702e-07, "loss": 0.4057, "step": 14004 }, { "epoch": 2.59, "learning_rate": 9.586130846503327e-07, "loss": 0.4115, "step": 14005 }, { "epoch": 2.59, "learning_rate": 9.577598754399919e-07, "loss": 0.4322, "step": 14006 }, { "epoch": 2.59, "learning_rate": 9.56907026998294e-07, "loss": 0.4088, "step": 14007 }, { "epoch": 2.59, "learning_rate": 9.560545393592614e-07, "loss": 0.3884, "step": 14008 }, { "epoch": 2.59, "learning_rate": 9.55202412556907e-07, "loss": 0.41, "step": 14009 }, { "epoch": 2.59, "learning_rate": 9.543506466252317e-07, "loss": 0.4267, "step": 14010 }, { "epoch": 2.59, "learning_rate": 9.53499241598217e-07, "loss": 0.4124, "step": 14011 }, { "epoch": 2.59, "learning_rate": 9.526481975098346e-07, "loss": 0.3819, "step": 14012 }, { "epoch": 2.59, "learning_rate": 9.517975143940384e-07, "loss": 0.4172, "step": 14013 }, { "epoch": 2.59, "learning_rate": 9.509471922847668e-07, "loss": 0.4151, "step": 14014 }, { "epoch": 2.59, "learning_rate": 9.500972312159507e-07, "loss": 0.4099, "step": 14015 }, { "epoch": 2.59, "learning_rate": 9.492476312214982e-07, "loss": 0.4112, "step": 14016 }, { "epoch": 2.59, "learning_rate": 9.483983923353091e-07, "loss": 0.4278, "step": 14017 }, { "epoch": 2.59, "learning_rate": 9.47549514591265e-07, "loss": 0.4267, "step": 14018 }, { "epoch": 2.59, "learning_rate": 9.467009980232356e-07, "loss": 0.4145, "step": 14019 }, { "epoch": 2.59, "learning_rate": 9.458528426650737e-07, "loss": 0.3922, "step": 14020 }, { "epoch": 2.59, "learning_rate": 9.450050485506212e-07, "loss": 0.4231, "step": 14021 }, { "epoch": 2.59, "learning_rate": 9.441576157137012e-07, "loss": 0.4227, "step": 14022 }, { "epoch": 2.59, "learning_rate": 9.433105441881274e-07, "loss": 0.4125, "step": 14023 }, { "epoch": 2.59, "learning_rate": 9.42463834007693e-07, "loss": 0.4049, "step": 14024 }, { "epoch": 2.59, "learning_rate": 9.416174852061844e-07, "loss": 0.4359, "step": 14025 }, { "epoch": 2.6, "learning_rate": 9.407714978173654e-07, "loss": 0.4261, "step": 14026 }, { "epoch": 2.6, "learning_rate": 9.399258718749915e-07, "loss": 0.4008, "step": 14027 }, { "epoch": 2.6, "learning_rate": 9.390806074128e-07, "loss": 0.4225, "step": 14028 }, { "epoch": 2.6, "learning_rate": 9.382357044645185e-07, "loss": 0.4104, "step": 14029 }, { "epoch": 2.6, "learning_rate": 9.373911630638544e-07, "loss": 0.4272, "step": 14030 }, { "epoch": 2.6, "learning_rate": 9.365469832445018e-07, "loss": 0.4086, "step": 14031 }, { "epoch": 2.6, "learning_rate": 9.357031650401472e-07, "loss": 0.4185, "step": 14032 }, { "epoch": 2.6, "learning_rate": 9.348597084844513e-07, "loss": 0.4178, "step": 14033 }, { "epoch": 2.6, "learning_rate": 9.340166136110706e-07, "loss": 0.4119, "step": 14034 }, { "epoch": 2.6, "learning_rate": 9.331738804536428e-07, "loss": 0.4383, "step": 14035 }, { "epoch": 2.6, "learning_rate": 9.323315090457885e-07, "loss": 0.4006, "step": 14036 }, { "epoch": 2.6, "learning_rate": 9.314894994211199e-07, "loss": 0.4344, "step": 14037 }, { "epoch": 2.6, "learning_rate": 9.3064785161323e-07, "loss": 0.4221, "step": 14038 }, { "epoch": 2.6, "learning_rate": 9.298065656556998e-07, "loss": 0.4175, "step": 14039 }, { "epoch": 2.6, "learning_rate": 9.289656415820935e-07, "loss": 0.4139, "step": 14040 }, { "epoch": 2.6, "learning_rate": 9.281250794259644e-07, "loss": 0.4134, "step": 14041 }, { "epoch": 2.6, "learning_rate": 9.272848792208489e-07, "loss": 0.4258, "step": 14042 }, { "epoch": 2.6, "learning_rate": 9.264450410002679e-07, "loss": 0.4181, "step": 14043 }, { "epoch": 2.6, "learning_rate": 9.256055647977313e-07, "loss": 0.411, "step": 14044 }, { "epoch": 2.6, "learning_rate": 9.247664506467313e-07, "loss": 0.4015, "step": 14045 }, { "epoch": 2.6, "learning_rate": 9.239276985807488e-07, "loss": 0.4105, "step": 14046 }, { "epoch": 2.6, "learning_rate": 9.230893086332471e-07, "loss": 0.4201, "step": 14047 }, { "epoch": 2.6, "learning_rate": 9.222512808376748e-07, "loss": 0.4187, "step": 14048 }, { "epoch": 2.6, "learning_rate": 9.21413615227471e-07, "loss": 0.3972, "step": 14049 }, { "epoch": 2.6, "learning_rate": 9.205763118360533e-07, "loss": 0.3922, "step": 14050 }, { "epoch": 2.6, "learning_rate": 9.197393706968328e-07, "loss": 0.4211, "step": 14051 }, { "epoch": 2.6, "learning_rate": 9.189027918432003e-07, "loss": 0.4334, "step": 14052 }, { "epoch": 2.6, "learning_rate": 9.180665753085305e-07, "loss": 0.4161, "step": 14053 }, { "epoch": 2.6, "learning_rate": 9.172307211261922e-07, "loss": 0.4046, "step": 14054 }, { "epoch": 2.6, "learning_rate": 9.163952293295298e-07, "loss": 0.4004, "step": 14055 }, { "epoch": 2.6, "learning_rate": 9.155600999518821e-07, "loss": 0.4169, "step": 14056 }, { "epoch": 2.6, "learning_rate": 9.147253330265659e-07, "loss": 0.4154, "step": 14057 }, { "epoch": 2.6, "learning_rate": 9.138909285868869e-07, "loss": 0.4, "step": 14058 }, { "epoch": 2.6, "learning_rate": 9.130568866661393e-07, "loss": 0.3882, "step": 14059 }, { "epoch": 2.6, "learning_rate": 9.122232072975956e-07, "loss": 0.4021, "step": 14060 }, { "epoch": 2.6, "learning_rate": 9.113898905145225e-07, "loss": 0.403, "step": 14061 }, { "epoch": 2.6, "learning_rate": 9.105569363501632e-07, "loss": 0.4056, "step": 14062 }, { "epoch": 2.6, "learning_rate": 9.097243448377568e-07, "loss": 0.4138, "step": 14063 }, { "epoch": 2.6, "learning_rate": 9.08892116010518e-07, "loss": 0.4116, "step": 14064 }, { "epoch": 2.6, "learning_rate": 9.0806024990165e-07, "loss": 0.4437, "step": 14065 }, { "epoch": 2.6, "learning_rate": 9.072287465443463e-07, "loss": 0.4177, "step": 14066 }, { "epoch": 2.6, "learning_rate": 9.063976059717794e-07, "loss": 0.4313, "step": 14067 }, { "epoch": 2.6, "learning_rate": 9.055668282171137e-07, "loss": 0.4311, "step": 14068 }, { "epoch": 2.6, "learning_rate": 9.047364133134917e-07, "loss": 0.4078, "step": 14069 }, { "epoch": 2.6, "learning_rate": 9.039063612940491e-07, "loss": 0.4134, "step": 14070 }, { "epoch": 2.6, "learning_rate": 9.030766721918993e-07, "loss": 0.4236, "step": 14071 }, { "epoch": 2.6, "learning_rate": 9.022473460401505e-07, "loss": 0.4131, "step": 14072 }, { "epoch": 2.6, "learning_rate": 9.014183828718859e-07, "loss": 0.4001, "step": 14073 }, { "epoch": 2.6, "learning_rate": 9.005897827201848e-07, "loss": 0.413, "step": 14074 }, { "epoch": 2.6, "learning_rate": 8.99761545618102e-07, "loss": 0.4164, "step": 14075 }, { "epoch": 2.6, "learning_rate": 8.989336715986874e-07, "loss": 0.4177, "step": 14076 }, { "epoch": 2.6, "learning_rate": 8.981061606949671e-07, "loss": 0.4199, "step": 14077 }, { "epoch": 2.6, "learning_rate": 8.9727901293996e-07, "loss": 0.4211, "step": 14078 }, { "epoch": 2.6, "learning_rate": 8.964522283666677e-07, "loss": 0.4179, "step": 14079 }, { "epoch": 2.6, "learning_rate": 8.956258070080759e-07, "loss": 0.4034, "step": 14080 }, { "epoch": 2.61, "learning_rate": 8.947997488971583e-07, "loss": 0.4084, "step": 14081 }, { "epoch": 2.61, "learning_rate": 8.939740540668718e-07, "loss": 0.431, "step": 14082 }, { "epoch": 2.61, "learning_rate": 8.931487225501634e-07, "loss": 0.3936, "step": 14083 }, { "epoch": 2.61, "learning_rate": 8.923237543799579e-07, "loss": 0.4189, "step": 14084 }, { "epoch": 2.61, "learning_rate": 8.914991495891745e-07, "loss": 0.4335, "step": 14085 }, { "epoch": 2.61, "learning_rate": 8.906749082107103e-07, "loss": 0.4148, "step": 14086 }, { "epoch": 2.61, "learning_rate": 8.8985103027745e-07, "loss": 0.4003, "step": 14087 }, { "epoch": 2.61, "learning_rate": 8.890275158222695e-07, "loss": 0.4005, "step": 14088 }, { "epoch": 2.61, "learning_rate": 8.882043648780192e-07, "loss": 0.4109, "step": 14089 }, { "epoch": 2.61, "learning_rate": 8.873815774775474e-07, "loss": 0.4051, "step": 14090 }, { "epoch": 2.61, "learning_rate": 8.865591536536788e-07, "loss": 0.4075, "step": 14091 }, { "epoch": 2.61, "learning_rate": 8.857370934392262e-07, "loss": 0.4278, "step": 14092 }, { "epoch": 2.61, "learning_rate": 8.849153968669899e-07, "loss": 0.3958, "step": 14093 }, { "epoch": 2.61, "learning_rate": 8.840940639697504e-07, "loss": 0.4171, "step": 14094 }, { "epoch": 2.61, "learning_rate": 8.832730947802837e-07, "loss": 0.4101, "step": 14095 }, { "epoch": 2.61, "learning_rate": 8.824524893313402e-07, "loss": 0.4005, "step": 14096 }, { "epoch": 2.61, "learning_rate": 8.816322476556593e-07, "loss": 0.4177, "step": 14097 }, { "epoch": 2.61, "learning_rate": 8.808123697859728e-07, "loss": 0.4146, "step": 14098 }, { "epoch": 2.61, "learning_rate": 8.799928557549864e-07, "loss": 0.4247, "step": 14099 }, { "epoch": 2.61, "learning_rate": 8.791737055954019e-07, "loss": 0.4248, "step": 14100 }, { "epoch": 2.61, "learning_rate": 8.783549193398999e-07, "loss": 0.412, "step": 14101 }, { "epoch": 2.61, "learning_rate": 8.775364970211464e-07, "loss": 0.4297, "step": 14102 }, { "epoch": 2.61, "learning_rate": 8.767184386717986e-07, "loss": 0.3918, "step": 14103 }, { "epoch": 2.61, "learning_rate": 8.759007443244915e-07, "loss": 0.42, "step": 14104 }, { "epoch": 2.61, "learning_rate": 8.750834140118536e-07, "loss": 0.4051, "step": 14105 }, { "epoch": 2.61, "learning_rate": 8.74266447766492e-07, "loss": 0.3968, "step": 14106 }, { "epoch": 2.61, "learning_rate": 8.73449845621005e-07, "loss": 0.4277, "step": 14107 }, { "epoch": 2.61, "learning_rate": 8.726336076079723e-07, "loss": 0.3967, "step": 14108 }, { "epoch": 2.61, "learning_rate": 8.718177337599576e-07, "loss": 0.408, "step": 14109 }, { "epoch": 2.61, "learning_rate": 8.710022241095162e-07, "loss": 0.4112, "step": 14110 }, { "epoch": 2.61, "learning_rate": 8.70187078689183e-07, "loss": 0.4235, "step": 14111 }, { "epoch": 2.61, "learning_rate": 8.693722975314833e-07, "loss": 0.4045, "step": 14112 }, { "epoch": 2.61, "learning_rate": 8.685578806689243e-07, "loss": 0.4194, "step": 14113 }, { "epoch": 2.61, "learning_rate": 8.677438281339978e-07, "loss": 0.3985, "step": 14114 }, { "epoch": 2.61, "learning_rate": 8.669301399591867e-07, "loss": 0.4345, "step": 14115 }, { "epoch": 2.61, "learning_rate": 8.661168161769507e-07, "loss": 0.4248, "step": 14116 }, { "epoch": 2.61, "learning_rate": 8.653038568197458e-07, "loss": 0.3995, "step": 14117 }, { "epoch": 2.61, "learning_rate": 8.644912619200041e-07, "loss": 0.3901, "step": 14118 }, { "epoch": 2.61, "learning_rate": 8.636790315101451e-07, "loss": 0.4295, "step": 14119 }, { "epoch": 2.61, "learning_rate": 8.628671656225785e-07, "loss": 0.3972, "step": 14120 }, { "epoch": 2.61, "learning_rate": 8.620556642896938e-07, "loss": 0.4074, "step": 14121 }, { "epoch": 2.61, "learning_rate": 8.612445275438719e-07, "loss": 0.4127, "step": 14122 }, { "epoch": 2.61, "learning_rate": 8.604337554174713e-07, "loss": 0.4337, "step": 14123 }, { "epoch": 2.61, "learning_rate": 8.59623347942844e-07, "loss": 0.4256, "step": 14124 }, { "epoch": 2.61, "learning_rate": 8.588133051523207e-07, "loss": 0.4058, "step": 14125 }, { "epoch": 2.61, "learning_rate": 8.580036270782243e-07, "loss": 0.4243, "step": 14126 }, { "epoch": 2.61, "learning_rate": 8.571943137528549e-07, "loss": 0.4301, "step": 14127 }, { "epoch": 2.61, "learning_rate": 8.563853652085064e-07, "loss": 0.4245, "step": 14128 }, { "epoch": 2.61, "learning_rate": 8.555767814774507e-07, "loss": 0.4086, "step": 14129 }, { "epoch": 2.61, "learning_rate": 8.547685625919544e-07, "loss": 0.4051, "step": 14130 }, { "epoch": 2.61, "learning_rate": 8.539607085842572e-07, "loss": 0.4173, "step": 14131 }, { "epoch": 2.61, "learning_rate": 8.531532194865966e-07, "loss": 0.42, "step": 14132 }, { "epoch": 2.61, "learning_rate": 8.523460953311858e-07, "loss": 0.4256, "step": 14133 }, { "epoch": 2.61, "learning_rate": 8.515393361502311e-07, "loss": 0.4069, "step": 14134 }, { "epoch": 2.62, "learning_rate": 8.507329419759192e-07, "loss": 0.4218, "step": 14135 }, { "epoch": 2.62, "learning_rate": 8.49926912840422e-07, "loss": 0.4184, "step": 14136 }, { "epoch": 2.62, "learning_rate": 8.491212487759015e-07, "loss": 0.4175, "step": 14137 }, { "epoch": 2.62, "learning_rate": 8.483159498144989e-07, "loss": 0.4143, "step": 14138 }, { "epoch": 2.62, "learning_rate": 8.47511015988347e-07, "loss": 0.4316, "step": 14139 }, { "epoch": 2.62, "learning_rate": 8.467064473295616e-07, "loss": 0.4215, "step": 14140 }, { "epoch": 2.62, "learning_rate": 8.459022438702391e-07, "loss": 0.4097, "step": 14141 }, { "epoch": 2.62, "learning_rate": 8.450984056424716e-07, "loss": 0.4049, "step": 14142 }, { "epoch": 2.62, "learning_rate": 8.442949326783256e-07, "loss": 0.4068, "step": 14143 }, { "epoch": 2.62, "learning_rate": 8.434918250098623e-07, "loss": 0.4205, "step": 14144 }, { "epoch": 2.62, "learning_rate": 8.426890826691214e-07, "loss": 0.3978, "step": 14145 }, { "epoch": 2.62, "learning_rate": 8.418867056881308e-07, "loss": 0.3991, "step": 14146 }, { "epoch": 2.62, "learning_rate": 8.41084694098907e-07, "loss": 0.4148, "step": 14147 }, { "epoch": 2.62, "learning_rate": 8.402830479334445e-07, "loss": 0.3953, "step": 14148 }, { "epoch": 2.62, "learning_rate": 8.394817672237321e-07, "loss": 0.3986, "step": 14149 }, { "epoch": 2.62, "learning_rate": 8.386808520017342e-07, "loss": 0.4046, "step": 14150 }, { "epoch": 2.62, "learning_rate": 8.378803022994109e-07, "loss": 0.4067, "step": 14151 }, { "epoch": 2.62, "learning_rate": 8.370801181486998e-07, "loss": 0.4058, "step": 14152 }, { "epoch": 2.62, "learning_rate": 8.362802995815255e-07, "loss": 0.3984, "step": 14153 }, { "epoch": 2.62, "learning_rate": 8.354808466298037e-07, "loss": 0.436, "step": 14154 }, { "epoch": 2.62, "learning_rate": 8.346817593254253e-07, "loss": 0.4206, "step": 14155 }, { "epoch": 2.62, "learning_rate": 8.338830377002782e-07, "loss": 0.421, "step": 14156 }, { "epoch": 2.62, "learning_rate": 8.33084681786227e-07, "loss": 0.4033, "step": 14157 }, { "epoch": 2.62, "learning_rate": 8.32286691615124e-07, "loss": 0.4294, "step": 14158 }, { "epoch": 2.62, "learning_rate": 8.314890672188092e-07, "loss": 0.4134, "step": 14159 }, { "epoch": 2.62, "learning_rate": 8.306918086291049e-07, "loss": 0.4143, "step": 14160 }, { "epoch": 2.62, "learning_rate": 8.298949158778213e-07, "loss": 0.4121, "step": 14161 }, { "epoch": 2.62, "learning_rate": 8.29098388996753e-07, "loss": 0.4204, "step": 14162 }, { "epoch": 2.62, "learning_rate": 8.283022280176789e-07, "loss": 0.3902, "step": 14163 }, { "epoch": 2.62, "learning_rate": 8.275064329723648e-07, "loss": 0.4114, "step": 14164 }, { "epoch": 2.62, "learning_rate": 8.267110038925607e-07, "loss": 0.4081, "step": 14165 }, { "epoch": 2.62, "learning_rate": 8.259159408100059e-07, "loss": 0.4074, "step": 14166 }, { "epoch": 2.62, "learning_rate": 8.251212437564193e-07, "loss": 0.4213, "step": 14167 }, { "epoch": 2.62, "learning_rate": 8.243269127635067e-07, "loss": 0.4115, "step": 14168 }, { "epoch": 2.62, "learning_rate": 8.235329478629638e-07, "loss": 0.4127, "step": 14169 }, { "epoch": 2.62, "learning_rate": 8.227393490864644e-07, "loss": 0.4257, "step": 14170 }, { "epoch": 2.62, "learning_rate": 8.21946116465675e-07, "loss": 0.4024, "step": 14171 }, { "epoch": 2.62, "learning_rate": 8.211532500322417e-07, "loss": 0.4195, "step": 14172 }, { "epoch": 2.62, "learning_rate": 8.203607498178012e-07, "loss": 0.3976, "step": 14173 }, { "epoch": 2.62, "learning_rate": 8.195686158539695e-07, "loss": 0.4288, "step": 14174 }, { "epoch": 2.62, "learning_rate": 8.187768481723546e-07, "loss": 0.3977, "step": 14175 }, { "epoch": 2.62, "learning_rate": 8.179854468045434e-07, "loss": 0.4321, "step": 14176 }, { "epoch": 2.62, "learning_rate": 8.171944117821141e-07, "loss": 0.389, "step": 14177 }, { "epoch": 2.62, "learning_rate": 8.164037431366256e-07, "loss": 0.4115, "step": 14178 }, { "epoch": 2.62, "learning_rate": 8.156134408996252e-07, "loss": 0.4137, "step": 14179 }, { "epoch": 2.62, "learning_rate": 8.148235051026432e-07, "loss": 0.4263, "step": 14180 }, { "epoch": 2.62, "learning_rate": 8.140339357771987e-07, "loss": 0.4132, "step": 14181 }, { "epoch": 2.62, "learning_rate": 8.132447329547911e-07, "loss": 0.4333, "step": 14182 }, { "epoch": 2.62, "learning_rate": 8.124558966669117e-07, "loss": 0.418, "step": 14183 }, { "epoch": 2.62, "learning_rate": 8.116674269450308e-07, "loss": 0.4286, "step": 14184 }, { "epoch": 2.62, "learning_rate": 8.10879323820607e-07, "loss": 0.4396, "step": 14185 }, { "epoch": 2.62, "learning_rate": 8.10091587325087e-07, "loss": 0.4144, "step": 14186 }, { "epoch": 2.62, "learning_rate": 8.093042174898958e-07, "loss": 0.4134, "step": 14187 }, { "epoch": 2.62, "learning_rate": 8.085172143464515e-07, "loss": 0.4116, "step": 14188 }, { "epoch": 2.63, "learning_rate": 8.077305779261535e-07, "loss": 0.4173, "step": 14189 }, { "epoch": 2.63, "learning_rate": 8.069443082603846e-07, "loss": 0.4027, "step": 14190 }, { "epoch": 2.63, "learning_rate": 8.061584053805194e-07, "loss": 0.4182, "step": 14191 }, { "epoch": 2.63, "learning_rate": 8.053728693179086e-07, "loss": 0.417, "step": 14192 }, { "epoch": 2.63, "learning_rate": 8.045877001039004e-07, "loss": 0.4029, "step": 14193 }, { "epoch": 2.63, "learning_rate": 8.038028977698154e-07, "loss": 0.4224, "step": 14194 }, { "epoch": 2.63, "learning_rate": 8.030184623469706e-07, "loss": 0.4098, "step": 14195 }, { "epoch": 2.63, "learning_rate": 8.02234393866661e-07, "loss": 0.4196, "step": 14196 }, { "epoch": 2.63, "learning_rate": 8.014506923601684e-07, "loss": 0.4385, "step": 14197 }, { "epoch": 2.63, "learning_rate": 8.006673578587642e-07, "loss": 0.416, "step": 14198 }, { "epoch": 2.63, "learning_rate": 7.998843903936993e-07, "loss": 0.425, "step": 14199 }, { "epoch": 2.63, "learning_rate": 7.99101789996215e-07, "loss": 0.3955, "step": 14200 }, { "epoch": 2.63, "learning_rate": 7.983195566975333e-07, "loss": 0.4201, "step": 14201 }, { "epoch": 2.63, "learning_rate": 7.975376905288645e-07, "loss": 0.4016, "step": 14202 }, { "epoch": 2.63, "learning_rate": 7.967561915214039e-07, "loss": 0.404, "step": 14203 }, { "epoch": 2.63, "learning_rate": 7.95975059706332e-07, "loss": 0.3866, "step": 14204 }, { "epoch": 2.63, "learning_rate": 7.951942951148151e-07, "loss": 0.4029, "step": 14205 }, { "epoch": 2.63, "learning_rate": 7.944138977780036e-07, "loss": 0.4028, "step": 14206 }, { "epoch": 2.63, "learning_rate": 7.936338677270328e-07, "loss": 0.4139, "step": 14207 }, { "epoch": 2.63, "learning_rate": 7.928542049930266e-07, "loss": 0.4193, "step": 14208 }, { "epoch": 2.63, "learning_rate": 7.9207490960709e-07, "loss": 0.431, "step": 14209 }, { "epoch": 2.63, "learning_rate": 7.912959816003174e-07, "loss": 0.4114, "step": 14210 }, { "epoch": 2.63, "learning_rate": 7.90517421003787e-07, "loss": 0.4195, "step": 14211 }, { "epoch": 2.63, "learning_rate": 7.897392278485572e-07, "loss": 0.406, "step": 14212 }, { "epoch": 2.63, "learning_rate": 7.889614021656833e-07, "loss": 0.3942, "step": 14213 }, { "epoch": 2.63, "learning_rate": 7.881839439861926e-07, "loss": 0.4072, "step": 14214 }, { "epoch": 2.63, "learning_rate": 7.874068533411094e-07, "loss": 0.4158, "step": 14215 }, { "epoch": 2.63, "learning_rate": 7.866301302614343e-07, "loss": 0.4053, "step": 14216 }, { "epoch": 2.63, "learning_rate": 7.858537747781614e-07, "loss": 0.4149, "step": 14217 }, { "epoch": 2.63, "learning_rate": 7.850777869222626e-07, "loss": 0.4266, "step": 14218 }, { "epoch": 2.63, "learning_rate": 7.843021667246975e-07, "loss": 0.4149, "step": 14219 }, { "epoch": 2.63, "learning_rate": 7.835269142164148e-07, "loss": 0.3876, "step": 14220 }, { "epoch": 2.63, "learning_rate": 7.827520294283431e-07, "loss": 0.4267, "step": 14221 }, { "epoch": 2.63, "learning_rate": 7.81977512391402e-07, "loss": 0.4267, "step": 14222 }, { "epoch": 2.63, "learning_rate": 7.812033631364901e-07, "loss": 0.4127, "step": 14223 }, { "epoch": 2.63, "learning_rate": 7.804295816944962e-07, "loss": 0.4035, "step": 14224 }, { "epoch": 2.63, "learning_rate": 7.796561680962921e-07, "loss": 0.411, "step": 14225 }, { "epoch": 2.63, "learning_rate": 7.788831223727367e-07, "loss": 0.4089, "step": 14226 }, { "epoch": 2.63, "learning_rate": 7.781104445546717e-07, "loss": 0.4322, "step": 14227 }, { "epoch": 2.63, "learning_rate": 7.773381346729269e-07, "loss": 0.4093, "step": 14228 }, { "epoch": 2.63, "learning_rate": 7.765661927583134e-07, "loss": 0.4163, "step": 14229 }, { "epoch": 2.63, "learning_rate": 7.757946188416343e-07, "loss": 0.408, "step": 14230 }, { "epoch": 2.63, "learning_rate": 7.750234129536693e-07, "loss": 0.4274, "step": 14231 }, { "epoch": 2.63, "learning_rate": 7.742525751251928e-07, "loss": 0.4144, "step": 14232 }, { "epoch": 2.63, "learning_rate": 7.734821053869579e-07, "loss": 0.4294, "step": 14233 }, { "epoch": 2.63, "learning_rate": 7.727120037697023e-07, "loss": 0.4075, "step": 14234 }, { "epoch": 2.63, "learning_rate": 7.719422703041557e-07, "loss": 0.4183, "step": 14235 }, { "epoch": 2.63, "learning_rate": 7.711729050210259e-07, "loss": 0.4235, "step": 14236 }, { "epoch": 2.63, "learning_rate": 7.704039079510117e-07, "loss": 0.4112, "step": 14237 }, { "epoch": 2.63, "learning_rate": 7.696352791247919e-07, "loss": 0.4167, "step": 14238 }, { "epoch": 2.63, "learning_rate": 7.688670185730363e-07, "loss": 0.4104, "step": 14239 }, { "epoch": 2.63, "learning_rate": 7.680991263263959e-07, "loss": 0.3836, "step": 14240 }, { "epoch": 2.63, "learning_rate": 7.673316024155064e-07, "loss": 0.4093, "step": 14241 }, { "epoch": 2.63, "learning_rate": 7.665644468709932e-07, "loss": 0.436, "step": 14242 }, { "epoch": 2.64, "learning_rate": 7.657976597234628e-07, "loss": 0.3991, "step": 14243 }, { "epoch": 2.64, "learning_rate": 7.650312410035099e-07, "loss": 0.4092, "step": 14244 }, { "epoch": 2.64, "learning_rate": 7.64265190741712e-07, "loss": 0.4109, "step": 14245 }, { "epoch": 2.64, "learning_rate": 7.634995089686326e-07, "loss": 0.4124, "step": 14246 }, { "epoch": 2.64, "learning_rate": 7.627341957148238e-07, "loss": 0.3972, "step": 14247 }, { "epoch": 2.64, "learning_rate": 7.619692510108157e-07, "loss": 0.4117, "step": 14248 }, { "epoch": 2.64, "learning_rate": 7.612046748871327e-07, "loss": 0.434, "step": 14249 }, { "epoch": 2.64, "learning_rate": 7.604404673742782e-07, "loss": 0.4235, "step": 14250 }, { "epoch": 2.64, "learning_rate": 7.596766285027413e-07, "loss": 0.4264, "step": 14251 }, { "epoch": 2.64, "learning_rate": 7.589131583029996e-07, "loss": 0.4174, "step": 14252 }, { "epoch": 2.64, "learning_rate": 7.581500568055122e-07, "loss": 0.4203, "step": 14253 }, { "epoch": 2.64, "learning_rate": 7.573873240407281e-07, "loss": 0.429, "step": 14254 }, { "epoch": 2.64, "learning_rate": 7.566249600390785e-07, "loss": 0.4106, "step": 14255 }, { "epoch": 2.64, "learning_rate": 7.558629648309767e-07, "loss": 0.4075, "step": 14256 }, { "epoch": 2.64, "learning_rate": 7.551013384468297e-07, "loss": 0.4, "step": 14257 }, { "epoch": 2.64, "learning_rate": 7.543400809170209e-07, "loss": 0.415, "step": 14258 }, { "epoch": 2.64, "learning_rate": 7.53579192271926e-07, "loss": 0.4134, "step": 14259 }, { "epoch": 2.64, "learning_rate": 7.528186725419029e-07, "loss": 0.4183, "step": 14260 }, { "epoch": 2.64, "learning_rate": 7.520585217572918e-07, "loss": 0.3928, "step": 14261 }, { "epoch": 2.64, "learning_rate": 7.512987399484262e-07, "loss": 0.4119, "step": 14262 }, { "epoch": 2.64, "learning_rate": 7.505393271456151e-07, "loss": 0.4126, "step": 14263 }, { "epoch": 2.64, "learning_rate": 7.497802833791612e-07, "loss": 0.405, "step": 14264 }, { "epoch": 2.64, "learning_rate": 7.490216086793467e-07, "loss": 0.4258, "step": 14265 }, { "epoch": 2.64, "learning_rate": 7.482633030764442e-07, "loss": 0.4365, "step": 14266 }, { "epoch": 2.64, "learning_rate": 7.475053666007059e-07, "loss": 0.4103, "step": 14267 }, { "epoch": 2.64, "learning_rate": 7.467477992823713e-07, "loss": 0.4192, "step": 14268 }, { "epoch": 2.64, "learning_rate": 7.459906011516704e-07, "loss": 0.4161, "step": 14269 }, { "epoch": 2.64, "learning_rate": 7.452337722388081e-07, "loss": 0.38, "step": 14270 }, { "epoch": 2.64, "learning_rate": 7.444773125739857e-07, "loss": 0.4121, "step": 14271 }, { "epoch": 2.64, "learning_rate": 7.437212221873813e-07, "loss": 0.4336, "step": 14272 }, { "epoch": 2.64, "learning_rate": 7.42965501109163e-07, "loss": 0.388, "step": 14273 }, { "epoch": 2.64, "learning_rate": 7.422101493694822e-07, "loss": 0.4172, "step": 14274 }, { "epoch": 2.64, "learning_rate": 7.41455166998477e-07, "loss": 0.4021, "step": 14275 }, { "epoch": 2.64, "learning_rate": 7.407005540262669e-07, "loss": 0.4081, "step": 14276 }, { "epoch": 2.64, "learning_rate": 7.399463104829629e-07, "loss": 0.4178, "step": 14277 }, { "epoch": 2.64, "learning_rate": 7.391924363986558e-07, "loss": 0.4256, "step": 14278 }, { "epoch": 2.64, "learning_rate": 7.384389318034258e-07, "loss": 0.4201, "step": 14279 }, { "epoch": 2.64, "learning_rate": 7.376857967273344e-07, "loss": 0.4005, "step": 14280 }, { "epoch": 2.64, "learning_rate": 7.369330312004308e-07, "loss": 0.4116, "step": 14281 }, { "epoch": 2.64, "learning_rate": 7.361806352527501e-07, "loss": 0.4248, "step": 14282 }, { "epoch": 2.64, "learning_rate": 7.354286089143093e-07, "loss": 0.3944, "step": 14283 }, { "epoch": 2.64, "learning_rate": 7.346769522151154e-07, "loss": 0.4219, "step": 14284 }, { "epoch": 2.64, "learning_rate": 7.339256651851556e-07, "loss": 0.4197, "step": 14285 }, { "epoch": 2.64, "learning_rate": 7.331747478544071e-07, "loss": 0.3995, "step": 14286 }, { "epoch": 2.64, "learning_rate": 7.32424200252827e-07, "loss": 0.4023, "step": 14287 }, { "epoch": 2.64, "learning_rate": 7.316740224103658e-07, "loss": 0.4335, "step": 14288 }, { "epoch": 2.64, "learning_rate": 7.309242143569506e-07, "loss": 0.4108, "step": 14289 }, { "epoch": 2.64, "learning_rate": 7.301747761224964e-07, "loss": 0.3959, "step": 14290 }, { "epoch": 2.64, "learning_rate": 7.294257077369072e-07, "loss": 0.4209, "step": 14291 }, { "epoch": 2.64, "learning_rate": 7.286770092300676e-07, "loss": 0.4174, "step": 14292 }, { "epoch": 2.64, "learning_rate": 7.279286806318508e-07, "loss": 0.4103, "step": 14293 }, { "epoch": 2.64, "learning_rate": 7.271807219721128e-07, "loss": 0.4109, "step": 14294 }, { "epoch": 2.64, "learning_rate": 7.264331332806951e-07, "loss": 0.428, "step": 14295 }, { "epoch": 2.64, "learning_rate": 7.256859145874262e-07, "loss": 0.4191, "step": 14296 }, { "epoch": 2.65, "learning_rate": 7.249390659221178e-07, "loss": 0.4129, "step": 14297 }, { "epoch": 2.65, "learning_rate": 7.241925873145694e-07, "loss": 0.4093, "step": 14298 }, { "epoch": 2.65, "learning_rate": 7.234464787945627e-07, "loss": 0.4031, "step": 14299 }, { "epoch": 2.65, "learning_rate": 7.227007403918651e-07, "loss": 0.4203, "step": 14300 }, { "epoch": 2.65, "learning_rate": 7.219553721362337e-07, "loss": 0.4182, "step": 14301 }, { "epoch": 2.65, "learning_rate": 7.212103740574028e-07, "loss": 0.4094, "step": 14302 }, { "epoch": 2.65, "learning_rate": 7.204657461851006e-07, "loss": 0.4055, "step": 14303 }, { "epoch": 2.65, "learning_rate": 7.197214885490355e-07, "loss": 0.3969, "step": 14304 }, { "epoch": 2.65, "learning_rate": 7.189776011788985e-07, "loss": 0.4345, "step": 14305 }, { "epoch": 2.65, "learning_rate": 7.182340841043733e-07, "loss": 0.4099, "step": 14306 }, { "epoch": 2.65, "learning_rate": 7.17490937355122e-07, "loss": 0.425, "step": 14307 }, { "epoch": 2.65, "learning_rate": 7.167481609607974e-07, "loss": 0.4008, "step": 14308 }, { "epoch": 2.65, "learning_rate": 7.160057549510324e-07, "loss": 0.4188, "step": 14309 }, { "epoch": 2.65, "learning_rate": 7.152637193554513e-07, "loss": 0.4116, "step": 14310 }, { "epoch": 2.65, "learning_rate": 7.145220542036569e-07, "loss": 0.4015, "step": 14311 }, { "epoch": 2.65, "learning_rate": 7.137807595252388e-07, "loss": 0.4112, "step": 14312 }, { "epoch": 2.65, "learning_rate": 7.130398353497781e-07, "loss": 0.4129, "step": 14313 }, { "epoch": 2.65, "learning_rate": 7.122992817068309e-07, "loss": 0.4257, "step": 14314 }, { "epoch": 2.65, "learning_rate": 7.11559098625949e-07, "loss": 0.414, "step": 14315 }, { "epoch": 2.65, "learning_rate": 7.108192861366614e-07, "loss": 0.3934, "step": 14316 }, { "epoch": 2.65, "learning_rate": 7.100798442684842e-07, "loss": 0.4052, "step": 14317 }, { "epoch": 2.65, "learning_rate": 7.093407730509239e-07, "loss": 0.4224, "step": 14318 }, { "epoch": 2.65, "learning_rate": 7.086020725134635e-07, "loss": 0.4031, "step": 14319 }, { "epoch": 2.65, "learning_rate": 7.078637426855795e-07, "loss": 0.3996, "step": 14320 }, { "epoch": 2.65, "learning_rate": 7.07125783596726e-07, "loss": 0.4202, "step": 14321 }, { "epoch": 2.65, "learning_rate": 7.063881952763507e-07, "loss": 0.4049, "step": 14322 }, { "epoch": 2.65, "learning_rate": 7.056509777538778e-07, "loss": 0.4189, "step": 14323 }, { "epoch": 2.65, "learning_rate": 7.049141310587248e-07, "loss": 0.4365, "step": 14324 }, { "epoch": 2.65, "learning_rate": 7.041776552202872e-07, "loss": 0.4604, "step": 14325 }, { "epoch": 2.65, "learning_rate": 7.034415502679514e-07, "loss": 0.4109, "step": 14326 }, { "epoch": 2.65, "learning_rate": 7.02705816231084e-07, "loss": 0.4047, "step": 14327 }, { "epoch": 2.65, "learning_rate": 7.019704531390426e-07, "loss": 0.4127, "step": 14328 }, { "epoch": 2.65, "learning_rate": 7.012354610211647e-07, "loss": 0.3992, "step": 14329 }, { "epoch": 2.65, "learning_rate": 7.005008399067759e-07, "loss": 0.4323, "step": 14330 }, { "epoch": 2.65, "learning_rate": 6.997665898251849e-07, "loss": 0.4253, "step": 14331 }, { "epoch": 2.65, "learning_rate": 6.990327108056905e-07, "loss": 0.4197, "step": 14332 }, { "epoch": 2.65, "learning_rate": 6.982992028775692e-07, "loss": 0.41, "step": 14333 }, { "epoch": 2.65, "learning_rate": 6.975660660700878e-07, "loss": 0.41, "step": 14334 }, { "epoch": 2.65, "learning_rate": 6.968333004124983e-07, "loss": 0.3923, "step": 14335 }, { "epoch": 2.65, "learning_rate": 6.96100905934034e-07, "loss": 0.4155, "step": 14336 }, { "epoch": 2.65, "learning_rate": 6.953688826639204e-07, "loss": 0.4015, "step": 14337 }, { "epoch": 2.65, "learning_rate": 6.946372306313609e-07, "loss": 0.4055, "step": 14338 }, { "epoch": 2.65, "learning_rate": 6.939059498655454e-07, "loss": 0.4144, "step": 14339 }, { "epoch": 2.65, "learning_rate": 6.931750403956538e-07, "loss": 0.4045, "step": 14340 }, { "epoch": 2.65, "learning_rate": 6.924445022508464e-07, "loss": 0.4234, "step": 14341 }, { "epoch": 2.65, "learning_rate": 6.917143354602718e-07, "loss": 0.434, "step": 14342 }, { "epoch": 2.65, "learning_rate": 6.909845400530623e-07, "loss": 0.4234, "step": 14343 }, { "epoch": 2.65, "learning_rate": 6.902551160583326e-07, "loss": 0.4191, "step": 14344 }, { "epoch": 2.65, "learning_rate": 6.895260635051882e-07, "loss": 0.4124, "step": 14345 }, { "epoch": 2.65, "learning_rate": 6.887973824227146e-07, "loss": 0.4086, "step": 14346 }, { "epoch": 2.65, "learning_rate": 6.880690728399886e-07, "loss": 0.4173, "step": 14347 }, { "epoch": 2.65, "learning_rate": 6.873411347860648e-07, "loss": 0.4185, "step": 14348 }, { "epoch": 2.65, "learning_rate": 6.866135682899866e-07, "loss": 0.4169, "step": 14349 }, { "epoch": 2.65, "learning_rate": 6.858863733807863e-07, "loss": 0.4072, "step": 14350 }, { "epoch": 2.66, "learning_rate": 6.85159550087472e-07, "loss": 0.3952, "step": 14351 }, { "epoch": 2.66, "learning_rate": 6.844330984390479e-07, "loss": 0.4262, "step": 14352 }, { "epoch": 2.66, "learning_rate": 6.837070184644945e-07, "loss": 0.4198, "step": 14353 }, { "epoch": 2.66, "learning_rate": 6.82981310192784e-07, "loss": 0.4113, "step": 14354 }, { "epoch": 2.66, "learning_rate": 6.822559736528689e-07, "loss": 0.4002, "step": 14355 }, { "epoch": 2.66, "learning_rate": 6.815310088736882e-07, "loss": 0.4267, "step": 14356 }, { "epoch": 2.66, "learning_rate": 6.808064158841688e-07, "loss": 0.4109, "step": 14357 }, { "epoch": 2.66, "learning_rate": 6.800821947132175e-07, "loss": 0.412, "step": 14358 }, { "epoch": 2.66, "learning_rate": 6.793583453897323e-07, "loss": 0.4047, "step": 14359 }, { "epoch": 2.66, "learning_rate": 6.786348679425936e-07, "loss": 0.4039, "step": 14360 }, { "epoch": 2.66, "learning_rate": 6.779117624006637e-07, "loss": 0.4124, "step": 14361 }, { "epoch": 2.66, "learning_rate": 6.771890287927962e-07, "loss": 0.4123, "step": 14362 }, { "epoch": 2.66, "learning_rate": 6.764666671478248e-07, "loss": 0.4024, "step": 14363 }, { "epoch": 2.66, "learning_rate": 6.75744677494572e-07, "loss": 0.3979, "step": 14364 }, { "epoch": 2.66, "learning_rate": 6.750230598618434e-07, "loss": 0.4168, "step": 14365 }, { "epoch": 2.66, "learning_rate": 6.743018142784286e-07, "loss": 0.3973, "step": 14366 }, { "epoch": 2.66, "learning_rate": 6.735809407731075e-07, "loss": 0.4224, "step": 14367 }, { "epoch": 2.66, "learning_rate": 6.728604393746374e-07, "loss": 0.4187, "step": 14368 }, { "epoch": 2.66, "learning_rate": 6.721403101117685e-07, "loss": 0.4202, "step": 14369 }, { "epoch": 2.66, "learning_rate": 6.714205530132301e-07, "loss": 0.3966, "step": 14370 }, { "epoch": 2.66, "learning_rate": 6.707011681077413e-07, "loss": 0.4262, "step": 14371 }, { "epoch": 2.66, "learning_rate": 6.699821554240016e-07, "loss": 0.3836, "step": 14372 }, { "epoch": 2.66, "learning_rate": 6.692635149907012e-07, "loss": 0.427, "step": 14373 }, { "epoch": 2.66, "learning_rate": 6.685452468365095e-07, "loss": 0.4109, "step": 14374 }, { "epoch": 2.66, "learning_rate": 6.678273509900879e-07, "loss": 0.4135, "step": 14375 }, { "epoch": 2.66, "learning_rate": 6.671098274800758e-07, "loss": 0.3954, "step": 14376 }, { "epoch": 2.66, "learning_rate": 6.663926763351025e-07, "loss": 0.4066, "step": 14377 }, { "epoch": 2.66, "learning_rate": 6.656758975837796e-07, "loss": 0.4124, "step": 14378 }, { "epoch": 2.66, "learning_rate": 6.649594912547086e-07, "loss": 0.4246, "step": 14379 }, { "epoch": 2.66, "learning_rate": 6.642434573764678e-07, "loss": 0.3997, "step": 14380 }, { "epoch": 2.66, "learning_rate": 6.635277959776309e-07, "loss": 0.4182, "step": 14381 }, { "epoch": 2.66, "learning_rate": 6.628125070867486e-07, "loss": 0.4104, "step": 14382 }, { "epoch": 2.66, "learning_rate": 6.620975907323579e-07, "loss": 0.4171, "step": 14383 }, { "epoch": 2.66, "learning_rate": 6.613830469429871e-07, "loss": 0.4171, "step": 14384 }, { "epoch": 2.66, "learning_rate": 6.606688757471402e-07, "loss": 0.419, "step": 14385 }, { "epoch": 2.66, "learning_rate": 6.599550771733165e-07, "loss": 0.3963, "step": 14386 }, { "epoch": 2.66, "learning_rate": 6.592416512499922e-07, "loss": 0.3965, "step": 14387 }, { "epoch": 2.66, "learning_rate": 6.585285980056299e-07, "loss": 0.4086, "step": 14388 }, { "epoch": 2.66, "learning_rate": 6.578159174686838e-07, "loss": 0.4043, "step": 14389 }, { "epoch": 2.66, "learning_rate": 6.571036096675831e-07, "loss": 0.413, "step": 14390 }, { "epoch": 2.66, "learning_rate": 6.563916746307531e-07, "loss": 0.4208, "step": 14391 }, { "epoch": 2.66, "learning_rate": 6.556801123865952e-07, "loss": 0.4271, "step": 14392 }, { "epoch": 2.66, "learning_rate": 6.549689229634992e-07, "loss": 0.4157, "step": 14393 }, { "epoch": 2.66, "learning_rate": 6.542581063898434e-07, "loss": 0.4072, "step": 14394 }, { "epoch": 2.66, "learning_rate": 6.535476626939841e-07, "loss": 0.4143, "step": 14395 }, { "epoch": 2.66, "learning_rate": 6.528375919042695e-07, "loss": 0.4101, "step": 14396 }, { "epoch": 2.66, "learning_rate": 6.521278940490283e-07, "loss": 0.4224, "step": 14397 }, { "epoch": 2.66, "learning_rate": 6.514185691565788e-07, "loss": 0.414, "step": 14398 }, { "epoch": 2.66, "learning_rate": 6.507096172552196e-07, "loss": 0.3929, "step": 14399 }, { "epoch": 2.66, "learning_rate": 6.500010383732347e-07, "loss": 0.4179, "step": 14400 }, { "epoch": 2.66, "learning_rate": 6.492928325388992e-07, "loss": 0.4204, "step": 14401 }, { "epoch": 2.66, "learning_rate": 6.48584999780466e-07, "loss": 0.4235, "step": 14402 }, { "epoch": 2.66, "learning_rate": 6.478775401261795e-07, "loss": 0.4002, "step": 14403 }, { "epoch": 2.66, "learning_rate": 6.471704536042633e-07, "loss": 0.4065, "step": 14404 }, { "epoch": 2.67, "learning_rate": 6.464637402429297e-07, "loss": 0.4168, "step": 14405 }, { "epoch": 2.67, "learning_rate": 6.457574000703748e-07, "loss": 0.4059, "step": 14406 }, { "epoch": 2.67, "learning_rate": 6.450514331147806e-07, "loss": 0.4291, "step": 14407 }, { "epoch": 2.67, "learning_rate": 6.443458394043156e-07, "loss": 0.4003, "step": 14408 }, { "epoch": 2.67, "learning_rate": 6.436406189671285e-07, "loss": 0.4065, "step": 14409 }, { "epoch": 2.67, "learning_rate": 6.429357718313578e-07, "loss": 0.3971, "step": 14410 }, { "epoch": 2.67, "learning_rate": 6.422312980251266e-07, "loss": 0.4251, "step": 14411 }, { "epoch": 2.67, "learning_rate": 6.415271975765403e-07, "loss": 0.434, "step": 14412 }, { "epoch": 2.67, "learning_rate": 6.408234705136928e-07, "loss": 0.4081, "step": 14413 }, { "epoch": 2.67, "learning_rate": 6.401201168646609e-07, "loss": 0.4163, "step": 14414 }, { "epoch": 2.67, "learning_rate": 6.394171366575053e-07, "loss": 0.4276, "step": 14415 }, { "epoch": 2.67, "learning_rate": 6.387145299202779e-07, "loss": 0.4362, "step": 14416 }, { "epoch": 2.67, "learning_rate": 6.380122966810065e-07, "loss": 0.3949, "step": 14417 }, { "epoch": 2.67, "learning_rate": 6.37310436967713e-07, "loss": 0.429, "step": 14418 }, { "epoch": 2.67, "learning_rate": 6.366089508083961e-07, "loss": 0.4032, "step": 14419 }, { "epoch": 2.67, "learning_rate": 6.35907838231048e-07, "loss": 0.4286, "step": 14420 }, { "epoch": 2.67, "learning_rate": 6.352070992636406e-07, "loss": 0.412, "step": 14421 }, { "epoch": 2.67, "learning_rate": 6.345067339341305e-07, "loss": 0.4108, "step": 14422 }, { "epoch": 2.67, "learning_rate": 6.338067422704619e-07, "loss": 0.4328, "step": 14423 }, { "epoch": 2.67, "learning_rate": 6.331071243005627e-07, "loss": 0.422, "step": 14424 }, { "epoch": 2.67, "learning_rate": 6.324078800523481e-07, "loss": 0.4387, "step": 14425 }, { "epoch": 2.67, "learning_rate": 6.317090095537137e-07, "loss": 0.4011, "step": 14426 }, { "epoch": 2.67, "learning_rate": 6.310105128325472e-07, "loss": 0.4171, "step": 14427 }, { "epoch": 2.67, "learning_rate": 6.303123899167129e-07, "loss": 0.4058, "step": 14428 }, { "epoch": 2.67, "learning_rate": 6.296146408340686e-07, "loss": 0.4041, "step": 14429 }, { "epoch": 2.67, "learning_rate": 6.289172656124498e-07, "loss": 0.4252, "step": 14430 }, { "epoch": 2.67, "learning_rate": 6.282202642796831e-07, "loss": 0.4228, "step": 14431 }, { "epoch": 2.67, "learning_rate": 6.275236368635751e-07, "loss": 0.4217, "step": 14432 }, { "epoch": 2.67, "learning_rate": 6.268273833919236e-07, "loss": 0.4181, "step": 14433 }, { "epoch": 2.67, "learning_rate": 6.261315038925031e-07, "loss": 0.4178, "step": 14434 }, { "epoch": 2.67, "learning_rate": 6.254359983930825e-07, "loss": 0.4178, "step": 14435 }, { "epoch": 2.67, "learning_rate": 6.247408669214083e-07, "loss": 0.425, "step": 14436 }, { "epoch": 2.67, "learning_rate": 6.240461095052141e-07, "loss": 0.4196, "step": 14437 }, { "epoch": 2.67, "learning_rate": 6.233517261722232e-07, "loss": 0.4022, "step": 14438 }, { "epoch": 2.67, "learning_rate": 6.226577169501357e-07, "loss": 0.4225, "step": 14439 }, { "epoch": 2.67, "learning_rate": 6.219640818666462e-07, "loss": 0.4167, "step": 14440 }, { "epoch": 2.67, "learning_rate": 6.212708209494245e-07, "loss": 0.4022, "step": 14441 }, { "epoch": 2.67, "learning_rate": 6.205779342261353e-07, "loss": 0.4157, "step": 14442 }, { "epoch": 2.67, "learning_rate": 6.198854217244199e-07, "loss": 0.4131, "step": 14443 }, { "epoch": 2.67, "learning_rate": 6.191932834719083e-07, "loss": 0.4202, "step": 14444 }, { "epoch": 2.67, "learning_rate": 6.185015194962174e-07, "loss": 0.4284, "step": 14445 }, { "epoch": 2.67, "learning_rate": 6.178101298249462e-07, "loss": 0.3984, "step": 14446 }, { "epoch": 2.67, "learning_rate": 6.171191144856814e-07, "loss": 0.4174, "step": 14447 }, { "epoch": 2.67, "learning_rate": 6.164284735059911e-07, "loss": 0.4276, "step": 14448 }, { "epoch": 2.67, "learning_rate": 6.15738206913431e-07, "loss": 0.4234, "step": 14449 }, { "epoch": 2.67, "learning_rate": 6.150483147355424e-07, "loss": 0.4064, "step": 14450 }, { "epoch": 2.67, "learning_rate": 6.143587969998499e-07, "loss": 0.4288, "step": 14451 }, { "epoch": 2.67, "learning_rate": 6.136696537338649e-07, "loss": 0.4156, "step": 14452 }, { "epoch": 2.67, "learning_rate": 6.129808849650831e-07, "loss": 0.4254, "step": 14453 }, { "epoch": 2.67, "learning_rate": 6.122924907209826e-07, "loss": 0.4384, "step": 14454 }, { "epoch": 2.67, "learning_rate": 6.116044710290325e-07, "loss": 0.4264, "step": 14455 }, { "epoch": 2.67, "learning_rate": 6.109168259166798e-07, "loss": 0.403, "step": 14456 }, { "epoch": 2.67, "learning_rate": 6.102295554113647e-07, "loss": 0.4091, "step": 14457 }, { "epoch": 2.67, "learning_rate": 6.095426595405052e-07, "loss": 0.4135, "step": 14458 }, { "epoch": 2.68, "learning_rate": 6.088561383315062e-07, "loss": 0.4247, "step": 14459 }, { "epoch": 2.68, "learning_rate": 6.081699918117612e-07, "loss": 0.41, "step": 14460 }, { "epoch": 2.68, "learning_rate": 6.074842200086429e-07, "loss": 0.4285, "step": 14461 }, { "epoch": 2.68, "learning_rate": 6.06798822949517e-07, "loss": 0.412, "step": 14462 }, { "epoch": 2.68, "learning_rate": 6.061138006617251e-07, "loss": 0.3969, "step": 14463 }, { "epoch": 2.68, "learning_rate": 6.05429153172602e-07, "loss": 0.4228, "step": 14464 }, { "epoch": 2.68, "learning_rate": 6.047448805094624e-07, "loss": 0.4013, "step": 14465 }, { "epoch": 2.68, "learning_rate": 6.040609826996058e-07, "loss": 0.4216, "step": 14466 }, { "epoch": 2.68, "learning_rate": 6.033774597703201e-07, "loss": 0.4328, "step": 14467 }, { "epoch": 2.68, "learning_rate": 6.02694311748876e-07, "loss": 0.4172, "step": 14468 }, { "epoch": 2.68, "learning_rate": 6.020115386625313e-07, "loss": 0.4137, "step": 14469 }, { "epoch": 2.68, "learning_rate": 6.013291405385268e-07, "loss": 0.4217, "step": 14470 }, { "epoch": 2.68, "learning_rate": 6.006471174040862e-07, "loss": 0.4122, "step": 14471 }, { "epoch": 2.68, "learning_rate": 5.999654692864254e-07, "loss": 0.4128, "step": 14472 }, { "epoch": 2.68, "learning_rate": 5.99284196212736e-07, "loss": 0.4149, "step": 14473 }, { "epoch": 2.68, "learning_rate": 5.986032982102053e-07, "loss": 0.4106, "step": 14474 }, { "epoch": 2.68, "learning_rate": 5.979227753059936e-07, "loss": 0.4099, "step": 14475 }, { "epoch": 2.68, "learning_rate": 5.97242627527258e-07, "loss": 0.4054, "step": 14476 }, { "epoch": 2.68, "learning_rate": 5.965628549011315e-07, "loss": 0.3992, "step": 14477 }, { "epoch": 2.68, "learning_rate": 5.95883457454739e-07, "loss": 0.3997, "step": 14478 }, { "epoch": 2.68, "learning_rate": 5.952044352151831e-07, "loss": 0.4272, "step": 14479 }, { "epoch": 2.68, "learning_rate": 5.94525788209559e-07, "loss": 0.3936, "step": 14480 }, { "epoch": 2.68, "learning_rate": 5.938475164649415e-07, "loss": 0.423, "step": 14481 }, { "epoch": 2.68, "learning_rate": 5.931696200083936e-07, "loss": 0.4053, "step": 14482 }, { "epoch": 2.68, "learning_rate": 5.924920988669602e-07, "loss": 0.4153, "step": 14483 }, { "epoch": 2.68, "learning_rate": 5.918149530676765e-07, "loss": 0.389, "step": 14484 }, { "epoch": 2.68, "learning_rate": 5.911381826375561e-07, "loss": 0.3977, "step": 14485 }, { "epoch": 2.68, "learning_rate": 5.904617876036034e-07, "loss": 0.4035, "step": 14486 }, { "epoch": 2.68, "learning_rate": 5.897857679928043e-07, "loss": 0.4152, "step": 14487 }, { "epoch": 2.68, "learning_rate": 5.891101238321284e-07, "loss": 0.4297, "step": 14488 }, { "epoch": 2.68, "learning_rate": 5.884348551485364e-07, "loss": 0.4074, "step": 14489 }, { "epoch": 2.68, "learning_rate": 5.877599619689678e-07, "loss": 0.3886, "step": 14490 }, { "epoch": 2.68, "learning_rate": 5.870854443203511e-07, "loss": 0.4095, "step": 14491 }, { "epoch": 2.68, "learning_rate": 5.864113022295981e-07, "loss": 0.4075, "step": 14492 }, { "epoch": 2.68, "learning_rate": 5.857375357236039e-07, "loss": 0.4122, "step": 14493 }, { "epoch": 2.68, "learning_rate": 5.850641448292526e-07, "loss": 0.4112, "step": 14494 }, { "epoch": 2.68, "learning_rate": 5.843911295734106e-07, "loss": 0.3976, "step": 14495 }, { "epoch": 2.68, "learning_rate": 5.837184899829307e-07, "loss": 0.4186, "step": 14496 }, { "epoch": 2.68, "learning_rate": 5.830462260846492e-07, "loss": 0.4088, "step": 14497 }, { "epoch": 2.68, "learning_rate": 5.82374337905387e-07, "loss": 0.4079, "step": 14498 }, { "epoch": 2.68, "learning_rate": 5.817028254719537e-07, "loss": 0.4355, "step": 14499 }, { "epoch": 2.68, "learning_rate": 5.81031688811139e-07, "loss": 0.4116, "step": 14500 }, { "epoch": 2.68, "learning_rate": 5.803609279497225e-07, "loss": 0.4121, "step": 14501 }, { "epoch": 2.68, "learning_rate": 5.796905429144639e-07, "loss": 0.3966, "step": 14502 }, { "epoch": 2.68, "learning_rate": 5.790205337321108e-07, "loss": 0.4184, "step": 14503 }, { "epoch": 2.68, "learning_rate": 5.783509004293986e-07, "loss": 0.4153, "step": 14504 }, { "epoch": 2.68, "learning_rate": 5.776816430330389e-07, "loss": 0.4272, "step": 14505 }, { "epoch": 2.68, "learning_rate": 5.770127615697385e-07, "loss": 0.4118, "step": 14506 }, { "epoch": 2.68, "learning_rate": 5.763442560661803e-07, "loss": 0.4065, "step": 14507 }, { "epoch": 2.68, "learning_rate": 5.756761265490418e-07, "loss": 0.4095, "step": 14508 }, { "epoch": 2.68, "learning_rate": 5.750083730449763e-07, "loss": 0.4219, "step": 14509 }, { "epoch": 2.68, "learning_rate": 5.743409955806256e-07, "loss": 0.4132, "step": 14510 }, { "epoch": 2.68, "learning_rate": 5.736739941826197e-07, "loss": 0.4214, "step": 14511 }, { "epoch": 2.68, "learning_rate": 5.730073688775672e-07, "loss": 0.4053, "step": 14512 }, { "epoch": 2.69, "learning_rate": 5.723411196920692e-07, "loss": 0.4189, "step": 14513 }, { "epoch": 2.69, "learning_rate": 5.716752466527053e-07, "loss": 0.4051, "step": 14514 }, { "epoch": 2.69, "learning_rate": 5.710097497860412e-07, "loss": 0.3928, "step": 14515 }, { "epoch": 2.69, "learning_rate": 5.703446291186321e-07, "loss": 0.4322, "step": 14516 }, { "epoch": 2.69, "learning_rate": 5.696798846770124e-07, "loss": 0.4112, "step": 14517 }, { "epoch": 2.69, "learning_rate": 5.690155164877076e-07, "loss": 0.4008, "step": 14518 }, { "epoch": 2.69, "learning_rate": 5.68351524577223e-07, "loss": 0.3926, "step": 14519 }, { "epoch": 2.69, "learning_rate": 5.676879089720478e-07, "loss": 0.4093, "step": 14520 }, { "epoch": 2.69, "learning_rate": 5.670246696986636e-07, "loss": 0.4294, "step": 14521 }, { "epoch": 2.69, "learning_rate": 5.663618067835286e-07, "loss": 0.4076, "step": 14522 }, { "epoch": 2.69, "learning_rate": 5.656993202530936e-07, "loss": 0.415, "step": 14523 }, { "epoch": 2.69, "learning_rate": 5.650372101337864e-07, "loss": 0.4119, "step": 14524 }, { "epoch": 2.69, "learning_rate": 5.643754764520282e-07, "loss": 0.4076, "step": 14525 }, { "epoch": 2.69, "learning_rate": 5.637141192342165e-07, "loss": 0.4201, "step": 14526 }, { "epoch": 2.69, "learning_rate": 5.630531385067429e-07, "loss": 0.4107, "step": 14527 }, { "epoch": 2.69, "learning_rate": 5.623925342959757e-07, "loss": 0.3954, "step": 14528 }, { "epoch": 2.69, "learning_rate": 5.617323066282742e-07, "loss": 0.4139, "step": 14529 }, { "epoch": 2.69, "learning_rate": 5.610724555299785e-07, "loss": 0.4043, "step": 14530 }, { "epoch": 2.69, "learning_rate": 5.604129810274162e-07, "loss": 0.4055, "step": 14531 }, { "epoch": 2.69, "learning_rate": 5.597538831468985e-07, "loss": 0.3956, "step": 14532 }, { "epoch": 2.69, "learning_rate": 5.590951619147244e-07, "loss": 0.4141, "step": 14533 }, { "epoch": 2.69, "learning_rate": 5.584368173571719e-07, "loss": 0.4394, "step": 14534 }, { "epoch": 2.69, "learning_rate": 5.577788495005109e-07, "loss": 0.4063, "step": 14535 }, { "epoch": 2.69, "learning_rate": 5.571212583709929e-07, "loss": 0.4174, "step": 14536 }, { "epoch": 2.69, "learning_rate": 5.56464043994852e-07, "loss": 0.4028, "step": 14537 }, { "epoch": 2.69, "learning_rate": 5.558072063983122e-07, "loss": 0.4233, "step": 14538 }, { "epoch": 2.69, "learning_rate": 5.551507456075789e-07, "loss": 0.4173, "step": 14539 }, { "epoch": 2.69, "learning_rate": 5.544946616488456e-07, "loss": 0.395, "step": 14540 }, { "epoch": 2.69, "learning_rate": 5.538389545482869e-07, "loss": 0.407, "step": 14541 }, { "epoch": 2.69, "learning_rate": 5.531836243320632e-07, "loss": 0.3855, "step": 14542 }, { "epoch": 2.69, "learning_rate": 5.525286710263244e-07, "loss": 0.382, "step": 14543 }, { "epoch": 2.69, "learning_rate": 5.518740946571988e-07, "loss": 0.4139, "step": 14544 }, { "epoch": 2.69, "learning_rate": 5.512198952508053e-07, "loss": 0.4205, "step": 14545 }, { "epoch": 2.69, "learning_rate": 5.50566072833244e-07, "loss": 0.418, "step": 14546 }, { "epoch": 2.69, "learning_rate": 5.499126274305999e-07, "loss": 0.4083, "step": 14547 }, { "epoch": 2.69, "learning_rate": 5.492595590689476e-07, "loss": 0.4137, "step": 14548 }, { "epoch": 2.69, "learning_rate": 5.486068677743395e-07, "loss": 0.4178, "step": 14549 }, { "epoch": 2.69, "learning_rate": 5.479545535728192e-07, "loss": 0.4161, "step": 14550 }, { "epoch": 2.69, "learning_rate": 5.473026164904116e-07, "loss": 0.3959, "step": 14551 }, { "epoch": 2.69, "learning_rate": 5.466510565531302e-07, "loss": 0.4051, "step": 14552 }, { "epoch": 2.69, "learning_rate": 5.459998737869687e-07, "loss": 0.4197, "step": 14553 }, { "epoch": 2.69, "learning_rate": 5.453490682179063e-07, "loss": 0.4249, "step": 14554 }, { "epoch": 2.69, "learning_rate": 5.446986398719134e-07, "loss": 0.419, "step": 14555 }, { "epoch": 2.69, "learning_rate": 5.44048588774938e-07, "loss": 0.3981, "step": 14556 }, { "epoch": 2.69, "learning_rate": 5.433989149529173e-07, "loss": 0.4093, "step": 14557 }, { "epoch": 2.69, "learning_rate": 5.427496184317716e-07, "loss": 0.4306, "step": 14558 }, { "epoch": 2.69, "learning_rate": 5.421006992374056e-07, "loss": 0.4395, "step": 14559 }, { "epoch": 2.69, "learning_rate": 5.414521573957121e-07, "loss": 0.3958, "step": 14560 }, { "epoch": 2.69, "learning_rate": 5.408039929325637e-07, "loss": 0.4247, "step": 14561 }, { "epoch": 2.69, "learning_rate": 5.401562058738242e-07, "loss": 0.4237, "step": 14562 }, { "epoch": 2.69, "learning_rate": 5.395087962453382e-07, "loss": 0.4194, "step": 14563 }, { "epoch": 2.69, "learning_rate": 5.388617640729332e-07, "loss": 0.4314, "step": 14564 }, { "epoch": 2.69, "learning_rate": 5.382151093824295e-07, "loss": 0.4017, "step": 14565 }, { "epoch": 2.69, "learning_rate": 5.375688321996231e-07, "loss": 0.398, "step": 14566 }, { "epoch": 2.7, "learning_rate": 5.369229325503022e-07, "loss": 0.4295, "step": 14567 }, { "epoch": 2.7, "learning_rate": 5.362774104602353e-07, "loss": 0.4126, "step": 14568 }, { "epoch": 2.7, "learning_rate": 5.356322659551772e-07, "loss": 0.4129, "step": 14569 }, { "epoch": 2.7, "learning_rate": 5.349874990608706e-07, "loss": 0.4271, "step": 14570 }, { "epoch": 2.7, "learning_rate": 5.343431098030371e-07, "loss": 0.4089, "step": 14571 }, { "epoch": 2.7, "learning_rate": 5.336990982073908e-07, "loss": 0.3967, "step": 14572 }, { "epoch": 2.7, "learning_rate": 5.330554642996211e-07, "loss": 0.4229, "step": 14573 }, { "epoch": 2.7, "learning_rate": 5.324122081054128e-07, "loss": 0.4297, "step": 14574 }, { "epoch": 2.7, "learning_rate": 5.317693296504279e-07, "loss": 0.416, "step": 14575 }, { "epoch": 2.7, "learning_rate": 5.311268289603178e-07, "loss": 0.4292, "step": 14576 }, { "epoch": 2.7, "learning_rate": 5.304847060607143e-07, "loss": 0.4322, "step": 14577 }, { "epoch": 2.7, "learning_rate": 5.298429609772404e-07, "loss": 0.4204, "step": 14578 }, { "epoch": 2.7, "learning_rate": 5.292015937354966e-07, "loss": 0.4079, "step": 14579 }, { "epoch": 2.7, "learning_rate": 5.28560604361077e-07, "loss": 0.4069, "step": 14580 }, { "epoch": 2.7, "learning_rate": 5.279199928795509e-07, "loss": 0.4194, "step": 14581 }, { "epoch": 2.7, "learning_rate": 5.272797593164825e-07, "loss": 0.419, "step": 14582 }, { "epoch": 2.7, "learning_rate": 5.266399036974112e-07, "loss": 0.4099, "step": 14583 }, { "epoch": 2.7, "learning_rate": 5.260004260478702e-07, "loss": 0.4243, "step": 14584 }, { "epoch": 2.7, "learning_rate": 5.253613263933721e-07, "loss": 0.4132, "step": 14585 }, { "epoch": 2.7, "learning_rate": 5.247226047594122e-07, "loss": 0.418, "step": 14586 }, { "epoch": 2.7, "learning_rate": 5.240842611714803e-07, "loss": 0.4044, "step": 14587 }, { "epoch": 2.7, "learning_rate": 5.234462956550402e-07, "loss": 0.425, "step": 14588 }, { "epoch": 2.7, "learning_rate": 5.228087082355493e-07, "loss": 0.4014, "step": 14589 }, { "epoch": 2.7, "learning_rate": 5.221714989384441e-07, "loss": 0.4095, "step": 14590 }, { "epoch": 2.7, "learning_rate": 5.215346677891464e-07, "loss": 0.4121, "step": 14591 }, { "epoch": 2.7, "learning_rate": 5.208982148130681e-07, "loss": 0.3995, "step": 14592 }, { "epoch": 2.7, "learning_rate": 5.202621400356001e-07, "loss": 0.395, "step": 14593 }, { "epoch": 2.7, "learning_rate": 5.19626443482123e-07, "loss": 0.4143, "step": 14594 }, { "epoch": 2.7, "learning_rate": 5.189911251779977e-07, "loss": 0.3939, "step": 14595 }, { "epoch": 2.7, "learning_rate": 5.183561851485719e-07, "loss": 0.4066, "step": 14596 }, { "epoch": 2.7, "learning_rate": 5.177216234191806e-07, "loss": 0.4266, "step": 14597 }, { "epoch": 2.7, "learning_rate": 5.170874400151393e-07, "loss": 0.3957, "step": 14598 }, { "epoch": 2.7, "learning_rate": 5.164536349617533e-07, "loss": 0.4261, "step": 14599 }, { "epoch": 2.7, "learning_rate": 5.158202082843078e-07, "loss": 0.4175, "step": 14600 }, { "epoch": 2.7, "learning_rate": 5.151871600080782e-07, "loss": 0.4073, "step": 14601 }, { "epoch": 2.7, "learning_rate": 5.1455449015832e-07, "loss": 0.4359, "step": 14602 }, { "epoch": 2.7, "learning_rate": 5.139221987602738e-07, "loss": 0.4205, "step": 14603 }, { "epoch": 2.7, "learning_rate": 5.132902858391708e-07, "loss": 0.4217, "step": 14604 }, { "epoch": 2.7, "learning_rate": 5.126587514202197e-07, "loss": 0.4188, "step": 14605 }, { "epoch": 2.7, "learning_rate": 5.120275955286202e-07, "loss": 0.4223, "step": 14606 }, { "epoch": 2.7, "learning_rate": 5.113968181895535e-07, "loss": 0.4177, "step": 14607 }, { "epoch": 2.7, "learning_rate": 5.107664194281847e-07, "loss": 0.4411, "step": 14608 }, { "epoch": 2.7, "learning_rate": 5.101363992696684e-07, "loss": 0.4093, "step": 14609 }, { "epoch": 2.7, "learning_rate": 5.095067577391377e-07, "loss": 0.4088, "step": 14610 }, { "epoch": 2.7, "learning_rate": 5.088774948617181e-07, "loss": 0.3993, "step": 14611 }, { "epoch": 2.7, "learning_rate": 5.082486106625139e-07, "loss": 0.4188, "step": 14612 }, { "epoch": 2.7, "learning_rate": 5.076201051666164e-07, "loss": 0.4136, "step": 14613 }, { "epoch": 2.7, "learning_rate": 5.069919783991018e-07, "loss": 0.421, "step": 14614 }, { "epoch": 2.7, "learning_rate": 5.063642303850302e-07, "loss": 0.4157, "step": 14615 }, { "epoch": 2.7, "learning_rate": 5.057368611494507e-07, "loss": 0.4041, "step": 14616 }, { "epoch": 2.7, "learning_rate": 5.051098707173929e-07, "loss": 0.4185, "step": 14617 }, { "epoch": 2.7, "learning_rate": 5.044832591138693e-07, "loss": 0.4244, "step": 14618 }, { "epoch": 2.7, "learning_rate": 5.038570263638854e-07, "loss": 0.4228, "step": 14619 }, { "epoch": 2.7, "learning_rate": 5.032311724924232e-07, "loss": 0.3895, "step": 14620 }, { "epoch": 2.71, "learning_rate": 5.026056975244554e-07, "loss": 0.4281, "step": 14621 }, { "epoch": 2.71, "learning_rate": 5.019806014849349e-07, "loss": 0.4166, "step": 14622 }, { "epoch": 2.71, "learning_rate": 5.013558843988042e-07, "loss": 0.4143, "step": 14623 }, { "epoch": 2.71, "learning_rate": 5.007315462909867e-07, "loss": 0.3965, "step": 14624 }, { "epoch": 2.71, "learning_rate": 5.001075871863948e-07, "loss": 0.4146, "step": 14625 }, { "epoch": 2.71, "learning_rate": 4.994840071099194e-07, "loss": 0.4287, "step": 14626 }, { "epoch": 2.71, "learning_rate": 4.988608060864442e-07, "loss": 0.4171, "step": 14627 }, { "epoch": 2.71, "learning_rate": 4.982379841408314e-07, "loss": 0.4118, "step": 14628 }, { "epoch": 2.71, "learning_rate": 4.976155412979311e-07, "loss": 0.4345, "step": 14629 }, { "epoch": 2.71, "learning_rate": 4.969934775825769e-07, "loss": 0.4201, "step": 14630 }, { "epoch": 2.71, "learning_rate": 4.963717930195888e-07, "loss": 0.4157, "step": 14631 }, { "epoch": 2.71, "learning_rate": 4.957504876337704e-07, "loss": 0.3919, "step": 14632 }, { "epoch": 2.71, "learning_rate": 4.951295614499118e-07, "loss": 0.4049, "step": 14633 }, { "epoch": 2.71, "learning_rate": 4.945090144927867e-07, "loss": 0.4203, "step": 14634 }, { "epoch": 2.71, "learning_rate": 4.938888467871505e-07, "loss": 0.4052, "step": 14635 }, { "epoch": 2.71, "learning_rate": 4.932690583577516e-07, "loss": 0.4129, "step": 14636 }, { "epoch": 2.71, "learning_rate": 4.926496492293132e-07, "loss": 0.4083, "step": 14637 }, { "epoch": 2.71, "learning_rate": 4.920306194265534e-07, "loss": 0.4006, "step": 14638 }, { "epoch": 2.71, "learning_rate": 4.914119689741692e-07, "loss": 0.4121, "step": 14639 }, { "epoch": 2.71, "learning_rate": 4.907936978968408e-07, "loss": 0.3947, "step": 14640 }, { "epoch": 2.71, "learning_rate": 4.901758062192396e-07, "loss": 0.4079, "step": 14641 }, { "epoch": 2.71, "learning_rate": 4.895582939660149e-07, "loss": 0.4169, "step": 14642 }, { "epoch": 2.71, "learning_rate": 4.889411611618078e-07, "loss": 0.4145, "step": 14643 }, { "epoch": 2.71, "learning_rate": 4.883244078312377e-07, "loss": 0.4317, "step": 14644 }, { "epoch": 2.71, "learning_rate": 4.877080339989149e-07, "loss": 0.4042, "step": 14645 }, { "epoch": 2.71, "learning_rate": 4.870920396894296e-07, "loss": 0.4099, "step": 14646 }, { "epoch": 2.71, "learning_rate": 4.864764249273579e-07, "loss": 0.425, "step": 14647 }, { "epoch": 2.71, "learning_rate": 4.858611897372656e-07, "loss": 0.4132, "step": 14648 }, { "epoch": 2.71, "learning_rate": 4.852463341436941e-07, "loss": 0.4046, "step": 14649 }, { "epoch": 2.71, "learning_rate": 4.846318581711796e-07, "loss": 0.4439, "step": 14650 }, { "epoch": 2.71, "learning_rate": 4.840177618442366e-07, "loss": 0.4053, "step": 14651 }, { "epoch": 2.71, "learning_rate": 4.834040451873657e-07, "loss": 0.4093, "step": 14652 }, { "epoch": 2.71, "learning_rate": 4.827907082250549e-07, "loss": 0.4068, "step": 14653 }, { "epoch": 2.71, "learning_rate": 4.821777509817727e-07, "loss": 0.4125, "step": 14654 }, { "epoch": 2.71, "learning_rate": 4.81565173481977e-07, "loss": 0.388, "step": 14655 }, { "epoch": 2.71, "learning_rate": 4.809529757501096e-07, "loss": 0.418, "step": 14656 }, { "epoch": 2.71, "learning_rate": 4.803411578105921e-07, "loss": 0.4264, "step": 14657 }, { "epoch": 2.71, "learning_rate": 4.797297196878381e-07, "loss": 0.4101, "step": 14658 }, { "epoch": 2.71, "learning_rate": 4.791186614062415e-07, "loss": 0.4252, "step": 14659 }, { "epoch": 2.71, "learning_rate": 4.78507982990184e-07, "loss": 0.4234, "step": 14660 }, { "epoch": 2.71, "learning_rate": 4.778976844640293e-07, "loss": 0.3815, "step": 14661 }, { "epoch": 2.71, "learning_rate": 4.772877658521268e-07, "loss": 0.4173, "step": 14662 }, { "epoch": 2.71, "learning_rate": 4.7667822717881176e-07, "loss": 0.4034, "step": 14663 }, { "epoch": 2.71, "learning_rate": 4.760690684684022e-07, "loss": 0.427, "step": 14664 }, { "epoch": 2.71, "learning_rate": 4.7546028974520655e-07, "loss": 0.4382, "step": 14665 }, { "epoch": 2.71, "learning_rate": 4.748518910335076e-07, "loss": 0.3994, "step": 14666 }, { "epoch": 2.71, "learning_rate": 4.74243872357586e-07, "loss": 0.4046, "step": 14667 }, { "epoch": 2.71, "learning_rate": 4.7363623374169666e-07, "loss": 0.4109, "step": 14668 }, { "epoch": 2.71, "learning_rate": 4.730289752100825e-07, "loss": 0.4042, "step": 14669 }, { "epoch": 2.71, "learning_rate": 4.7242209678697526e-07, "loss": 0.4223, "step": 14670 }, { "epoch": 2.71, "learning_rate": 4.718155984965844e-07, "loss": 0.4109, "step": 14671 }, { "epoch": 2.71, "learning_rate": 4.712094803631129e-07, "loss": 0.4011, "step": 14672 }, { "epoch": 2.71, "learning_rate": 4.7060374241074016e-07, "loss": 0.4348, "step": 14673 }, { "epoch": 2.71, "learning_rate": 4.6999838466363355e-07, "loss": 0.4308, "step": 14674 }, { "epoch": 2.72, "learning_rate": 4.693934071459483e-07, "loss": 0.4196, "step": 14675 }, { "epoch": 2.72, "learning_rate": 4.687888098818194e-07, "loss": 0.4094, "step": 14676 }, { "epoch": 2.72, "learning_rate": 4.681845928953721e-07, "loss": 0.4102, "step": 14677 }, { "epoch": 2.72, "learning_rate": 4.675807562107104e-07, "loss": 0.3968, "step": 14678 }, { "epoch": 2.72, "learning_rate": 4.669772998519295e-07, "loss": 0.4072, "step": 14679 }, { "epoch": 2.72, "learning_rate": 4.663742238431024e-07, "loss": 0.4243, "step": 14680 }, { "epoch": 2.72, "learning_rate": 4.657715282082942e-07, "loss": 0.4268, "step": 14681 }, { "epoch": 2.72, "learning_rate": 4.6516921297154793e-07, "loss": 0.441, "step": 14682 }, { "epoch": 2.72, "learning_rate": 4.6456727815689883e-07, "loss": 0.3981, "step": 14683 }, { "epoch": 2.72, "learning_rate": 4.639657237883599e-07, "loss": 0.4077, "step": 14684 }, { "epoch": 2.72, "learning_rate": 4.633645498899342e-07, "loss": 0.4061, "step": 14685 }, { "epoch": 2.72, "learning_rate": 4.627637564856047e-07, "loss": 0.4106, "step": 14686 }, { "epoch": 2.72, "learning_rate": 4.6216334359934443e-07, "loss": 0.4221, "step": 14687 }, { "epoch": 2.72, "learning_rate": 4.615633112551077e-07, "loss": 0.4108, "step": 14688 }, { "epoch": 2.72, "learning_rate": 4.609636594768363e-07, "loss": 0.405, "step": 14689 }, { "epoch": 2.72, "learning_rate": 4.6036438828845343e-07, "loss": 0.3993, "step": 14690 }, { "epoch": 2.72, "learning_rate": 4.597654977138677e-07, "loss": 0.3906, "step": 14691 }, { "epoch": 2.72, "learning_rate": 4.591669877769767e-07, "loss": 0.427, "step": 14692 }, { "epoch": 2.72, "learning_rate": 4.585688585016568e-07, "loss": 0.4318, "step": 14693 }, { "epoch": 2.72, "learning_rate": 4.579711099117756e-07, "loss": 0.3997, "step": 14694 }, { "epoch": 2.72, "learning_rate": 4.573737420311808e-07, "loss": 0.427, "step": 14695 }, { "epoch": 2.72, "learning_rate": 4.567767548837054e-07, "loss": 0.4015, "step": 14696 }, { "epoch": 2.72, "learning_rate": 4.561801484931694e-07, "loss": 0.4111, "step": 14697 }, { "epoch": 2.72, "learning_rate": 4.555839228833736e-07, "loss": 0.4206, "step": 14698 }, { "epoch": 2.72, "learning_rate": 4.549880780781102e-07, "loss": 0.4246, "step": 14699 }, { "epoch": 2.72, "learning_rate": 4.543926141011501e-07, "loss": 0.3977, "step": 14700 }, { "epoch": 2.72, "learning_rate": 4.537975309762499e-07, "loss": 0.4122, "step": 14701 }, { "epoch": 2.72, "learning_rate": 4.5320282872715613e-07, "loss": 0.419, "step": 14702 }, { "epoch": 2.72, "learning_rate": 4.526085073775921e-07, "loss": 0.3845, "step": 14703 }, { "epoch": 2.72, "learning_rate": 4.520145669512732e-07, "loss": 0.4038, "step": 14704 }, { "epoch": 2.72, "learning_rate": 4.51421007471895e-07, "loss": 0.4277, "step": 14705 }, { "epoch": 2.72, "learning_rate": 4.508278289631396e-07, "loss": 0.3957, "step": 14706 }, { "epoch": 2.72, "learning_rate": 4.5023503144867474e-07, "loss": 0.4154, "step": 14707 }, { "epoch": 2.72, "learning_rate": 4.496426149521504e-07, "loss": 0.3983, "step": 14708 }, { "epoch": 2.72, "learning_rate": 4.4905057949720553e-07, "loss": 0.4049, "step": 14709 }, { "epoch": 2.72, "learning_rate": 4.484589251074567e-07, "loss": 0.404, "step": 14710 }, { "epoch": 2.72, "learning_rate": 4.47867651806515e-07, "loss": 0.4159, "step": 14711 }, { "epoch": 2.72, "learning_rate": 4.4727675961796836e-07, "loss": 0.4089, "step": 14712 }, { "epoch": 2.72, "learning_rate": 4.4668624856539114e-07, "loss": 0.4079, "step": 14713 }, { "epoch": 2.72, "learning_rate": 4.460961186723456e-07, "loss": 0.4219, "step": 14714 }, { "epoch": 2.72, "learning_rate": 4.4550636996237626e-07, "loss": 0.4096, "step": 14715 }, { "epoch": 2.72, "learning_rate": 4.449170024590144e-07, "loss": 0.4243, "step": 14716 }, { "epoch": 2.72, "learning_rate": 4.443280161857721e-07, "loss": 0.418, "step": 14717 }, { "epoch": 2.72, "learning_rate": 4.437394111661508e-07, "loss": 0.4157, "step": 14718 }, { "epoch": 2.72, "learning_rate": 4.4315118742363385e-07, "loss": 0.4176, "step": 14719 }, { "epoch": 2.72, "learning_rate": 4.425633449816891e-07, "loss": 0.4238, "step": 14720 }, { "epoch": 2.72, "learning_rate": 4.4197588386377443e-07, "loss": 0.4114, "step": 14721 }, { "epoch": 2.72, "learning_rate": 4.413888040933245e-07, "loss": 0.4192, "step": 14722 }, { "epoch": 2.72, "learning_rate": 4.408021056937628e-07, "loss": 0.4084, "step": 14723 }, { "epoch": 2.72, "learning_rate": 4.4021578868850054e-07, "loss": 0.4095, "step": 14724 }, { "epoch": 2.72, "learning_rate": 4.3962985310092686e-07, "loss": 0.4249, "step": 14725 }, { "epoch": 2.72, "learning_rate": 4.3904429895442303e-07, "loss": 0.415, "step": 14726 }, { "epoch": 2.72, "learning_rate": 4.3845912627234923e-07, "loss": 0.4081, "step": 14727 }, { "epoch": 2.72, "learning_rate": 4.3787433507805455e-07, "loss": 0.4239, "step": 14728 }, { "epoch": 2.73, "learning_rate": 4.3728992539486925e-07, "loss": 0.4085, "step": 14729 }, { "epoch": 2.73, "learning_rate": 4.3670589724611134e-07, "loss": 0.407, "step": 14730 }, { "epoch": 2.73, "learning_rate": 4.361222506550822e-07, "loss": 0.4323, "step": 14731 }, { "epoch": 2.73, "learning_rate": 4.355389856450687e-07, "loss": 0.4178, "step": 14732 }, { "epoch": 2.73, "learning_rate": 4.3495610223934003e-07, "loss": 0.4071, "step": 14733 }, { "epoch": 2.73, "learning_rate": 4.343736004611554e-07, "loss": 0.4127, "step": 14734 }, { "epoch": 2.73, "learning_rate": 4.337914803337517e-07, "loss": 0.3996, "step": 14735 }, { "epoch": 2.73, "learning_rate": 4.3320974188035825e-07, "loss": 0.4051, "step": 14736 }, { "epoch": 2.73, "learning_rate": 4.32628385124183e-07, "loss": 0.4033, "step": 14737 }, { "epoch": 2.73, "learning_rate": 4.3204741008842313e-07, "loss": 0.4285, "step": 14738 }, { "epoch": 2.73, "learning_rate": 4.314668167962566e-07, "loss": 0.4028, "step": 14739 }, { "epoch": 2.73, "learning_rate": 4.30886605270846e-07, "loss": 0.4142, "step": 14740 }, { "epoch": 2.73, "learning_rate": 4.3030677553534626e-07, "loss": 0.4187, "step": 14741 }, { "epoch": 2.73, "learning_rate": 4.297273276128855e-07, "loss": 0.4261, "step": 14742 }, { "epoch": 2.73, "learning_rate": 4.291482615265874e-07, "loss": 0.4015, "step": 14743 }, { "epoch": 2.73, "learning_rate": 4.285695772995535e-07, "loss": 0.4163, "step": 14744 }, { "epoch": 2.73, "learning_rate": 4.27991274954872e-07, "loss": 0.3918, "step": 14745 }, { "epoch": 2.73, "learning_rate": 4.274133545156167e-07, "loss": 0.3957, "step": 14746 }, { "epoch": 2.73, "learning_rate": 4.268358160048447e-07, "loss": 0.4022, "step": 14747 }, { "epoch": 2.73, "learning_rate": 4.2625865944560086e-07, "loss": 0.4203, "step": 14748 }, { "epoch": 2.73, "learning_rate": 4.256818848609112e-07, "loss": 0.4153, "step": 14749 }, { "epoch": 2.73, "learning_rate": 4.251054922737863e-07, "loss": 0.4106, "step": 14750 }, { "epoch": 2.73, "learning_rate": 4.2452948170722653e-07, "loss": 0.409, "step": 14751 }, { "epoch": 2.73, "learning_rate": 4.239538531842102e-07, "loss": 0.4093, "step": 14752 }, { "epoch": 2.73, "learning_rate": 4.233786067277068e-07, "loss": 0.3894, "step": 14753 }, { "epoch": 2.73, "learning_rate": 4.228037423606657e-07, "loss": 0.43, "step": 14754 }, { "epoch": 2.73, "learning_rate": 4.2222926010602407e-07, "loss": 0.411, "step": 14755 }, { "epoch": 2.73, "learning_rate": 4.216551599867025e-07, "loss": 0.4029, "step": 14756 }, { "epoch": 2.73, "learning_rate": 4.2108144202560485e-07, "loss": 0.3984, "step": 14757 }, { "epoch": 2.73, "learning_rate": 4.20508106245624e-07, "loss": 0.4064, "step": 14758 }, { "epoch": 2.73, "learning_rate": 4.1993515266963267e-07, "loss": 0.4189, "step": 14759 }, { "epoch": 2.73, "learning_rate": 4.1936258132049266e-07, "loss": 0.4168, "step": 14760 }, { "epoch": 2.73, "learning_rate": 4.187903922210479e-07, "loss": 0.4133, "step": 14761 }, { "epoch": 2.73, "learning_rate": 4.1821858539412676e-07, "loss": 0.4177, "step": 14762 }, { "epoch": 2.73, "learning_rate": 4.176471608625443e-07, "loss": 0.4174, "step": 14763 }, { "epoch": 2.73, "learning_rate": 4.170761186490979e-07, "loss": 0.4261, "step": 14764 }, { "epoch": 2.73, "learning_rate": 4.165054587765727e-07, "loss": 0.4133, "step": 14765 }, { "epoch": 2.73, "learning_rate": 4.15935181267737e-07, "loss": 0.4047, "step": 14766 }, { "epoch": 2.73, "learning_rate": 4.153652861453417e-07, "loss": 0.3925, "step": 14767 }, { "epoch": 2.73, "learning_rate": 4.147957734321273e-07, "loss": 0.4005, "step": 14768 }, { "epoch": 2.73, "learning_rate": 4.142266431508135e-07, "loss": 0.4064, "step": 14769 }, { "epoch": 2.73, "learning_rate": 4.1365789532410996e-07, "loss": 0.4076, "step": 14770 }, { "epoch": 2.73, "learning_rate": 4.1308952997470843e-07, "loss": 0.3897, "step": 14771 }, { "epoch": 2.73, "learning_rate": 4.1252154712528416e-07, "loss": 0.4029, "step": 14772 }, { "epoch": 2.73, "learning_rate": 4.119539467985001e-07, "loss": 0.4336, "step": 14773 }, { "epoch": 2.73, "learning_rate": 4.113867290170004e-07, "loss": 0.4325, "step": 14774 }, { "epoch": 2.73, "learning_rate": 4.10819893803418e-07, "loss": 0.3985, "step": 14775 }, { "epoch": 2.73, "learning_rate": 4.1025344118036714e-07, "loss": 0.4118, "step": 14776 }, { "epoch": 2.73, "learning_rate": 4.0968737117045077e-07, "loss": 0.4167, "step": 14777 }, { "epoch": 2.73, "learning_rate": 4.0912168379625085e-07, "loss": 0.409, "step": 14778 }, { "epoch": 2.73, "learning_rate": 4.085563790803404e-07, "loss": 0.4251, "step": 14779 }, { "epoch": 2.73, "learning_rate": 4.0799145704527034e-07, "loss": 0.4214, "step": 14780 }, { "epoch": 2.73, "learning_rate": 4.074269177135837e-07, "loss": 0.416, "step": 14781 }, { "epoch": 2.73, "learning_rate": 4.0686276110780134e-07, "loss": 0.4123, "step": 14782 }, { "epoch": 2.74, "learning_rate": 4.0629898725043525e-07, "loss": 0.429, "step": 14783 }, { "epoch": 2.74, "learning_rate": 4.057355961639753e-07, "loss": 0.4263, "step": 14784 }, { "epoch": 2.74, "learning_rate": 4.0517258787090343e-07, "loss": 0.3918, "step": 14785 }, { "epoch": 2.74, "learning_rate": 4.0460996239367946e-07, "loss": 0.4129, "step": 14786 }, { "epoch": 2.74, "learning_rate": 4.040477197547543e-07, "loss": 0.4159, "step": 14787 }, { "epoch": 2.74, "learning_rate": 4.03485859976559e-07, "loss": 0.4007, "step": 14788 }, { "epoch": 2.74, "learning_rate": 4.0292438308150884e-07, "loss": 0.4259, "step": 14789 }, { "epoch": 2.74, "learning_rate": 4.023632890920082e-07, "loss": 0.4145, "step": 14790 }, { "epoch": 2.74, "learning_rate": 4.018025780304413e-07, "loss": 0.4182, "step": 14791 }, { "epoch": 2.74, "learning_rate": 4.012422499191826e-07, "loss": 0.387, "step": 14792 }, { "epoch": 2.74, "learning_rate": 4.0068230478058634e-07, "loss": 0.4046, "step": 14793 }, { "epoch": 2.74, "learning_rate": 4.0012274263699245e-07, "loss": 0.4138, "step": 14794 }, { "epoch": 2.74, "learning_rate": 3.9956356351072865e-07, "loss": 0.3931, "step": 14795 }, { "epoch": 2.74, "learning_rate": 3.9900476742410267e-07, "loss": 0.3931, "step": 14796 }, { "epoch": 2.74, "learning_rate": 3.9844635439941217e-07, "loss": 0.4105, "step": 14797 }, { "epoch": 2.74, "learning_rate": 3.9788832445893376e-07, "loss": 0.4003, "step": 14798 }, { "epoch": 2.74, "learning_rate": 3.973306776249342e-07, "loss": 0.409, "step": 14799 }, { "epoch": 2.74, "learning_rate": 3.967734139196622e-07, "loss": 0.3934, "step": 14800 }, { "epoch": 2.74, "learning_rate": 3.9621653336535004e-07, "loss": 0.4078, "step": 14801 }, { "epoch": 2.74, "learning_rate": 3.956600359842189e-07, "loss": 0.4091, "step": 14802 }, { "epoch": 2.74, "learning_rate": 3.951039217984687e-07, "loss": 0.3957, "step": 14803 }, { "epoch": 2.74, "learning_rate": 3.945481908302895e-07, "loss": 0.4444, "step": 14804 }, { "epoch": 2.74, "learning_rate": 3.939928431018536e-07, "loss": 0.3986, "step": 14805 }, { "epoch": 2.74, "learning_rate": 3.934378786353177e-07, "loss": 0.4166, "step": 14806 }, { "epoch": 2.74, "learning_rate": 3.9288329745282514e-07, "loss": 0.4385, "step": 14807 }, { "epoch": 2.74, "learning_rate": 3.9232909957650167e-07, "loss": 0.391, "step": 14808 }, { "epoch": 2.74, "learning_rate": 3.9177528502845954e-07, "loss": 0.3904, "step": 14809 }, { "epoch": 2.74, "learning_rate": 3.9122185383079435e-07, "loss": 0.4334, "step": 14810 }, { "epoch": 2.74, "learning_rate": 3.9066880600558523e-07, "loss": 0.4139, "step": 14811 }, { "epoch": 2.74, "learning_rate": 3.901161415749011e-07, "loss": 0.3999, "step": 14812 }, { "epoch": 2.74, "learning_rate": 3.895638605607899e-07, "loss": 0.4186, "step": 14813 }, { "epoch": 2.74, "learning_rate": 3.890119629852884e-07, "loss": 0.4187, "step": 14814 }, { "epoch": 2.74, "learning_rate": 3.8846044887041467e-07, "loss": 0.4141, "step": 14815 }, { "epoch": 2.74, "learning_rate": 3.879093182381732e-07, "loss": 0.4276, "step": 14816 }, { "epoch": 2.74, "learning_rate": 3.8735857111055543e-07, "loss": 0.4207, "step": 14817 }, { "epoch": 2.74, "learning_rate": 3.868082075095314e-07, "loss": 0.4046, "step": 14818 }, { "epoch": 2.74, "learning_rate": 3.862582274570625e-07, "loss": 0.4075, "step": 14819 }, { "epoch": 2.74, "learning_rate": 3.857086309750901e-07, "loss": 0.4185, "step": 14820 }, { "epoch": 2.74, "learning_rate": 3.8515941808554445e-07, "loss": 0.4187, "step": 14821 }, { "epoch": 2.74, "learning_rate": 3.8461058881033574e-07, "loss": 0.4048, "step": 14822 }, { "epoch": 2.74, "learning_rate": 3.84062143171362e-07, "loss": 0.4061, "step": 14823 }, { "epoch": 2.74, "learning_rate": 3.835140811905058e-07, "loss": 0.4175, "step": 14824 }, { "epoch": 2.74, "learning_rate": 3.8296640288963184e-07, "loss": 0.4057, "step": 14825 }, { "epoch": 2.74, "learning_rate": 3.824191082905948e-07, "loss": 0.4489, "step": 14826 }, { "epoch": 2.74, "learning_rate": 3.818721974152273e-07, "loss": 0.4182, "step": 14827 }, { "epoch": 2.74, "learning_rate": 3.8132567028535296e-07, "loss": 0.4112, "step": 14828 }, { "epoch": 2.74, "learning_rate": 3.807795269227743e-07, "loss": 0.4373, "step": 14829 }, { "epoch": 2.74, "learning_rate": 3.8023376734928506e-07, "loss": 0.4231, "step": 14830 }, { "epoch": 2.74, "learning_rate": 3.7968839158665673e-07, "loss": 0.4159, "step": 14831 }, { "epoch": 2.74, "learning_rate": 3.791433996566507e-07, "loss": 0.4136, "step": 14832 }, { "epoch": 2.74, "learning_rate": 3.7859879158100856e-07, "loss": 0.4102, "step": 14833 }, { "epoch": 2.74, "learning_rate": 3.7805456738146396e-07, "loss": 0.4223, "step": 14834 }, { "epoch": 2.74, "learning_rate": 3.775107270797251e-07, "loss": 0.4037, "step": 14835 }, { "epoch": 2.74, "learning_rate": 3.7696727069749475e-07, "loss": 0.4128, "step": 14836 }, { "epoch": 2.75, "learning_rate": 3.7642419825645316e-07, "loss": 0.4161, "step": 14837 }, { "epoch": 2.75, "learning_rate": 3.7588150977826755e-07, "loss": 0.4231, "step": 14838 }, { "epoch": 2.75, "learning_rate": 3.753392052845917e-07, "loss": 0.4031, "step": 14839 }, { "epoch": 2.75, "learning_rate": 3.747972847970616e-07, "loss": 0.4001, "step": 14840 }, { "epoch": 2.75, "learning_rate": 3.7425574833729995e-07, "loss": 0.4035, "step": 14841 }, { "epoch": 2.75, "learning_rate": 3.737145959269106e-07, "loss": 0.4112, "step": 14842 }, { "epoch": 2.75, "learning_rate": 3.7317382758748856e-07, "loss": 0.4245, "step": 14843 }, { "epoch": 2.75, "learning_rate": 3.7263344334060647e-07, "loss": 0.4016, "step": 14844 }, { "epoch": 2.75, "learning_rate": 3.720934432078249e-07, "loss": 0.4062, "step": 14845 }, { "epoch": 2.75, "learning_rate": 3.7155382721069e-07, "loss": 0.4114, "step": 14846 }, { "epoch": 2.75, "learning_rate": 3.7101459537073005e-07, "loss": 0.406, "step": 14847 }, { "epoch": 2.75, "learning_rate": 3.7047574770946114e-07, "loss": 0.4219, "step": 14848 }, { "epoch": 2.75, "learning_rate": 3.699372842483817e-07, "loss": 0.3852, "step": 14849 }, { "epoch": 2.75, "learning_rate": 3.693992050089734e-07, "loss": 0.41, "step": 14850 }, { "epoch": 2.75, "learning_rate": 3.688615100127069e-07, "loss": 0.3986, "step": 14851 }, { "epoch": 2.75, "learning_rate": 3.683241992810338e-07, "loss": 0.3993, "step": 14852 }, { "epoch": 2.75, "learning_rate": 3.6778727283539375e-07, "loss": 0.443, "step": 14853 }, { "epoch": 2.75, "learning_rate": 3.672507306972084e-07, "loss": 0.4102, "step": 14854 }, { "epoch": 2.75, "learning_rate": 3.667145728878829e-07, "loss": 0.4213, "step": 14855 }, { "epoch": 2.75, "learning_rate": 3.661787994288113e-07, "loss": 0.4202, "step": 14856 }, { "epoch": 2.75, "learning_rate": 3.6564341034136864e-07, "loss": 0.4037, "step": 14857 }, { "epoch": 2.75, "learning_rate": 3.6510840564691676e-07, "loss": 0.4157, "step": 14858 }, { "epoch": 2.75, "learning_rate": 3.645737853668008e-07, "loss": 0.4042, "step": 14859 }, { "epoch": 2.75, "learning_rate": 3.640395495223503e-07, "loss": 0.4213, "step": 14860 }, { "epoch": 2.75, "learning_rate": 3.635056981348828e-07, "loss": 0.4245, "step": 14861 }, { "epoch": 2.75, "learning_rate": 3.629722312256956e-07, "loss": 0.4239, "step": 14862 }, { "epoch": 2.75, "learning_rate": 3.624391488160739e-07, "loss": 0.4121, "step": 14863 }, { "epoch": 2.75, "learning_rate": 3.619064509272863e-07, "loss": 0.3921, "step": 14864 }, { "epoch": 2.75, "learning_rate": 3.613741375805879e-07, "loss": 0.4126, "step": 14865 }, { "epoch": 2.75, "learning_rate": 3.608422087972163e-07, "loss": 0.4283, "step": 14866 }, { "epoch": 2.75, "learning_rate": 3.6031066459839225e-07, "loss": 0.4312, "step": 14867 }, { "epoch": 2.75, "learning_rate": 3.5977950500532764e-07, "loss": 0.3915, "step": 14868 }, { "epoch": 2.75, "learning_rate": 3.5924873003921e-07, "loss": 0.4159, "step": 14869 }, { "epoch": 2.75, "learning_rate": 3.5871833972122016e-07, "loss": 0.4284, "step": 14870 }, { "epoch": 2.75, "learning_rate": 3.5818833407251894e-07, "loss": 0.4182, "step": 14871 }, { "epoch": 2.75, "learning_rate": 3.576587131142495e-07, "loss": 0.3983, "step": 14872 }, { "epoch": 2.75, "learning_rate": 3.5712947686754705e-07, "loss": 0.4138, "step": 14873 }, { "epoch": 2.75, "learning_rate": 3.566006253535237e-07, "loss": 0.4237, "step": 14874 }, { "epoch": 2.75, "learning_rate": 3.560721585932825e-07, "loss": 0.4142, "step": 14875 }, { "epoch": 2.75, "learning_rate": 3.5554407660790547e-07, "loss": 0.411, "step": 14876 }, { "epoch": 2.75, "learning_rate": 3.5501637941846467e-07, "loss": 0.431, "step": 14877 }, { "epoch": 2.75, "learning_rate": 3.5448906704601215e-07, "loss": 0.421, "step": 14878 }, { "epoch": 2.75, "learning_rate": 3.5396213951158885e-07, "loss": 0.4052, "step": 14879 }, { "epoch": 2.75, "learning_rate": 3.5343559683621573e-07, "loss": 0.4312, "step": 14880 }, { "epoch": 2.75, "learning_rate": 3.529094390409038e-07, "loss": 0.4086, "step": 14881 }, { "epoch": 2.75, "learning_rate": 3.523836661466429e-07, "loss": 0.4191, "step": 14882 }, { "epoch": 2.75, "learning_rate": 3.5185827817441174e-07, "loss": 0.4267, "step": 14883 }, { "epoch": 2.75, "learning_rate": 3.513332751451726e-07, "loss": 0.4195, "step": 14884 }, { "epoch": 2.75, "learning_rate": 3.5080865707987187e-07, "loss": 0.4164, "step": 14885 }, { "epoch": 2.75, "learning_rate": 3.502844239994396e-07, "loss": 0.4189, "step": 14886 }, { "epoch": 2.75, "learning_rate": 3.4976057592479465e-07, "loss": 0.4017, "step": 14887 }, { "epoch": 2.75, "learning_rate": 3.492371128768346e-07, "loss": 0.4253, "step": 14888 }, { "epoch": 2.75, "learning_rate": 3.487140348764462e-07, "loss": 0.4023, "step": 14889 }, { "epoch": 2.75, "learning_rate": 3.481913419444993e-07, "loss": 0.4216, "step": 14890 }, { "epoch": 2.76, "learning_rate": 3.4766903410184627e-07, "loss": 0.4181, "step": 14891 }, { "epoch": 2.76, "learning_rate": 3.4714711136933033e-07, "loss": 0.4022, "step": 14892 }, { "epoch": 2.76, "learning_rate": 3.4662557376777153e-07, "loss": 0.4269, "step": 14893 }, { "epoch": 2.76, "learning_rate": 3.4610442131797983e-07, "loss": 0.4215, "step": 14894 }, { "epoch": 2.76, "learning_rate": 3.4558365404074755e-07, "loss": 0.3943, "step": 14895 }, { "epoch": 2.76, "learning_rate": 3.450632719568525e-07, "loss": 0.4161, "step": 14896 }, { "epoch": 2.76, "learning_rate": 3.445432750870592e-07, "loss": 0.431, "step": 14897 }, { "epoch": 2.76, "learning_rate": 3.440236634521121e-07, "loss": 0.4175, "step": 14898 }, { "epoch": 2.76, "learning_rate": 3.435044370727414e-07, "loss": 0.4152, "step": 14899 }, { "epoch": 2.76, "learning_rate": 3.4298559596966705e-07, "loss": 0.4034, "step": 14900 }, { "epoch": 2.76, "learning_rate": 3.4246714016358596e-07, "loss": 0.4048, "step": 14901 }, { "epoch": 2.76, "learning_rate": 3.4194906967518815e-07, "loss": 0.4326, "step": 14902 }, { "epoch": 2.76, "learning_rate": 3.4143138452513936e-07, "loss": 0.4072, "step": 14903 }, { "epoch": 2.76, "learning_rate": 3.409140847340964e-07, "loss": 0.4058, "step": 14904 }, { "epoch": 2.76, "learning_rate": 3.403971703226983e-07, "loss": 0.4308, "step": 14905 }, { "epoch": 2.76, "learning_rate": 3.398806413115674e-07, "loss": 0.4101, "step": 14906 }, { "epoch": 2.76, "learning_rate": 3.393644977213162e-07, "loss": 0.4082, "step": 14907 }, { "epoch": 2.76, "learning_rate": 3.3884873957253373e-07, "loss": 0.4185, "step": 14908 }, { "epoch": 2.76, "learning_rate": 3.3833336688579907e-07, "loss": 0.4473, "step": 14909 }, { "epoch": 2.76, "learning_rate": 3.3781837968167585e-07, "loss": 0.4214, "step": 14910 }, { "epoch": 2.76, "learning_rate": 3.373037779807098e-07, "loss": 0.3939, "step": 14911 }, { "epoch": 2.76, "learning_rate": 3.3678956180343334e-07, "loss": 0.3922, "step": 14912 }, { "epoch": 2.76, "learning_rate": 3.3627573117036127e-07, "loss": 0.4073, "step": 14913 }, { "epoch": 2.76, "learning_rate": 3.3576228610199713e-07, "loss": 0.4169, "step": 14914 }, { "epoch": 2.76, "learning_rate": 3.352492266188245e-07, "loss": 0.4467, "step": 14915 }, { "epoch": 2.76, "learning_rate": 3.347365527413138e-07, "loss": 0.4148, "step": 14916 }, { "epoch": 2.76, "learning_rate": 3.3422426448992073e-07, "loss": 0.4146, "step": 14917 }, { "epoch": 2.76, "learning_rate": 3.3371236188508127e-07, "loss": 0.4218, "step": 14918 }, { "epoch": 2.76, "learning_rate": 3.332008449472246e-07, "loss": 0.423, "step": 14919 }, { "epoch": 2.76, "learning_rate": 3.326897136967555e-07, "loss": 0.4354, "step": 14920 }, { "epoch": 2.76, "learning_rate": 3.321789681540677e-07, "loss": 0.4141, "step": 14921 }, { "epoch": 2.76, "learning_rate": 3.316686083395415e-07, "loss": 0.4145, "step": 14922 }, { "epoch": 2.76, "learning_rate": 3.3115863427353513e-07, "loss": 0.4072, "step": 14923 }, { "epoch": 2.76, "learning_rate": 3.306490459763989e-07, "loss": 0.4179, "step": 14924 }, { "epoch": 2.76, "learning_rate": 3.301398434684633e-07, "loss": 0.4001, "step": 14925 }, { "epoch": 2.76, "learning_rate": 3.296310267700453e-07, "loss": 0.412, "step": 14926 }, { "epoch": 2.76, "learning_rate": 3.2912259590144324e-07, "loss": 0.4008, "step": 14927 }, { "epoch": 2.76, "learning_rate": 3.2861455088294637e-07, "loss": 0.4316, "step": 14928 }, { "epoch": 2.76, "learning_rate": 3.281068917348218e-07, "loss": 0.3931, "step": 14929 }, { "epoch": 2.76, "learning_rate": 3.2759961847732666e-07, "loss": 0.422, "step": 14930 }, { "epoch": 2.76, "learning_rate": 3.270927311306971e-07, "loss": 0.4206, "step": 14931 }, { "epoch": 2.76, "learning_rate": 3.2658622971515896e-07, "loss": 0.4115, "step": 14932 }, { "epoch": 2.76, "learning_rate": 3.2608011425092066e-07, "loss": 0.4051, "step": 14933 }, { "epoch": 2.76, "learning_rate": 3.2557438475817495e-07, "loss": 0.4224, "step": 14934 }, { "epoch": 2.76, "learning_rate": 3.250690412571e-07, "loss": 0.4127, "step": 14935 }, { "epoch": 2.76, "learning_rate": 3.2456408376785763e-07, "loss": 0.4182, "step": 14936 }, { "epoch": 2.76, "learning_rate": 3.2405951231059495e-07, "loss": 0.4441, "step": 14937 }, { "epoch": 2.76, "learning_rate": 3.2355532690544143e-07, "loss": 0.4099, "step": 14938 }, { "epoch": 2.76, "learning_rate": 3.2305152757251656e-07, "loss": 0.4347, "step": 14939 }, { "epoch": 2.76, "learning_rate": 3.225481143319187e-07, "loss": 0.4076, "step": 14940 }, { "epoch": 2.76, "learning_rate": 3.2204508720373506e-07, "loss": 0.4162, "step": 14941 }, { "epoch": 2.76, "learning_rate": 3.2154244620803297e-07, "loss": 0.4046, "step": 14942 }, { "epoch": 2.76, "learning_rate": 3.210401913648675e-07, "loss": 0.423, "step": 14943 }, { "epoch": 2.76, "learning_rate": 3.2053832269428044e-07, "loss": 0.4393, "step": 14944 }, { "epoch": 2.77, "learning_rate": 3.200368402162912e-07, "loss": 0.4225, "step": 14945 }, { "epoch": 2.77, "learning_rate": 3.1953574395091056e-07, "loss": 0.4015, "step": 14946 }, { "epoch": 2.77, "learning_rate": 3.190350339181314e-07, "loss": 0.4263, "step": 14947 }, { "epoch": 2.77, "learning_rate": 3.185347101379299e-07, "loss": 0.4077, "step": 14948 }, { "epoch": 2.77, "learning_rate": 3.1803477263026906e-07, "loss": 0.4224, "step": 14949 }, { "epoch": 2.77, "learning_rate": 3.1753522141509506e-07, "loss": 0.4033, "step": 14950 }, { "epoch": 2.77, "learning_rate": 3.170360565123387e-07, "loss": 0.4082, "step": 14951 }, { "epoch": 2.77, "learning_rate": 3.1653727794191734e-07, "loss": 0.3959, "step": 14952 }, { "epoch": 2.77, "learning_rate": 3.1603888572372845e-07, "loss": 0.4285, "step": 14953 }, { "epoch": 2.77, "learning_rate": 3.155408798776605e-07, "loss": 0.3896, "step": 14954 }, { "epoch": 2.77, "learning_rate": 3.150432604235798e-07, "loss": 0.4268, "step": 14955 }, { "epoch": 2.77, "learning_rate": 3.1454602738134276e-07, "loss": 0.4246, "step": 14956 }, { "epoch": 2.77, "learning_rate": 3.140491807707857e-07, "loss": 0.4204, "step": 14957 }, { "epoch": 2.77, "learning_rate": 3.1355272061173394e-07, "loss": 0.4171, "step": 14958 }, { "epoch": 2.77, "learning_rate": 3.1305664692399593e-07, "loss": 0.4267, "step": 14959 }, { "epoch": 2.77, "learning_rate": 3.1256095972736045e-07, "loss": 0.3963, "step": 14960 }, { "epoch": 2.77, "learning_rate": 3.1206565904160826e-07, "loss": 0.4213, "step": 14961 }, { "epoch": 2.77, "learning_rate": 3.115707448864991e-07, "loss": 0.4147, "step": 14962 }, { "epoch": 2.77, "learning_rate": 3.110762172817805e-07, "loss": 0.4156, "step": 14963 }, { "epoch": 2.77, "learning_rate": 3.105820762471823e-07, "loss": 0.4005, "step": 14964 }, { "epoch": 2.77, "learning_rate": 3.1008832180241754e-07, "loss": 0.3979, "step": 14965 }, { "epoch": 2.77, "learning_rate": 3.0959495396719053e-07, "loss": 0.4103, "step": 14966 }, { "epoch": 2.77, "learning_rate": 3.091019727611821e-07, "loss": 0.4161, "step": 14967 }, { "epoch": 2.77, "learning_rate": 3.0860937820406445e-07, "loss": 0.4014, "step": 14968 }, { "epoch": 2.77, "learning_rate": 3.0811717031548837e-07, "loss": 0.4066, "step": 14969 }, { "epoch": 2.77, "learning_rate": 3.076253491150938e-07, "loss": 0.4257, "step": 14970 }, { "epoch": 2.77, "learning_rate": 3.0713391462250276e-07, "loss": 0.4093, "step": 14971 }, { "epoch": 2.77, "learning_rate": 3.066428668573207e-07, "loss": 0.4184, "step": 14972 }, { "epoch": 2.77, "learning_rate": 3.061522058391442e-07, "loss": 0.4214, "step": 14973 }, { "epoch": 2.77, "learning_rate": 3.0566193158754643e-07, "loss": 0.4175, "step": 14974 }, { "epoch": 2.77, "learning_rate": 3.0517204412208733e-07, "loss": 0.4235, "step": 14975 }, { "epoch": 2.77, "learning_rate": 3.0468254346231573e-07, "loss": 0.4148, "step": 14976 }, { "epoch": 2.77, "learning_rate": 3.0419342962775933e-07, "loss": 0.4088, "step": 14977 }, { "epoch": 2.77, "learning_rate": 3.037047026379347e-07, "loss": 0.4073, "step": 14978 }, { "epoch": 2.77, "learning_rate": 3.0321636251233965e-07, "loss": 0.3914, "step": 14979 }, { "epoch": 2.77, "learning_rate": 3.0272840927045853e-07, "loss": 0.3886, "step": 14980 }, { "epoch": 2.77, "learning_rate": 3.0224084293175913e-07, "loss": 0.4379, "step": 14981 }, { "epoch": 2.77, "learning_rate": 3.01753663515697e-07, "loss": 0.4278, "step": 14982 }, { "epoch": 2.77, "learning_rate": 3.012668710417066e-07, "loss": 0.4126, "step": 14983 }, { "epoch": 2.77, "learning_rate": 3.007804655292124e-07, "loss": 0.434, "step": 14984 }, { "epoch": 2.77, "learning_rate": 3.0029444699761876e-07, "loss": 0.4089, "step": 14985 }, { "epoch": 2.77, "learning_rate": 2.9980881546631813e-07, "loss": 0.4087, "step": 14986 }, { "epoch": 2.77, "learning_rate": 2.993235709546871e-07, "loss": 0.4315, "step": 14987 }, { "epoch": 2.77, "learning_rate": 2.988387134820847e-07, "loss": 0.4157, "step": 14988 }, { "epoch": 2.77, "learning_rate": 2.9835424306785656e-07, "loss": 0.4153, "step": 14989 }, { "epoch": 2.77, "learning_rate": 2.978701597313327e-07, "loss": 0.4283, "step": 14990 }, { "epoch": 2.77, "learning_rate": 2.9738646349182664e-07, "loss": 0.4215, "step": 14991 }, { "epoch": 2.77, "learning_rate": 2.9690315436863517e-07, "loss": 0.4302, "step": 14992 }, { "epoch": 2.77, "learning_rate": 2.96420232381045e-07, "loss": 0.4175, "step": 14993 }, { "epoch": 2.77, "learning_rate": 2.959376975483197e-07, "loss": 0.4317, "step": 14994 }, { "epoch": 2.77, "learning_rate": 2.954555498897149e-07, "loss": 0.4247, "step": 14995 }, { "epoch": 2.77, "learning_rate": 2.949737894244675e-07, "loss": 0.4107, "step": 14996 }, { "epoch": 2.77, "learning_rate": 2.9449241617179545e-07, "loss": 0.4199, "step": 14997 }, { "epoch": 2.77, "learning_rate": 2.9401143015090784e-07, "loss": 0.3937, "step": 14998 }, { "epoch": 2.78, "learning_rate": 2.9353083138099257e-07, "loss": 0.4105, "step": 14999 }, { "epoch": 2.78, "learning_rate": 2.9305061988122774e-07, "loss": 0.4148, "step": 15000 }, { "epoch": 2.78, "learning_rate": 2.9257079567077016e-07, "loss": 0.4044, "step": 15001 }, { "epoch": 2.78, "learning_rate": 2.920913587687657e-07, "loss": 0.4167, "step": 15002 }, { "epoch": 2.78, "learning_rate": 2.9161230919434235e-07, "loss": 0.3904, "step": 15003 }, { "epoch": 2.78, "learning_rate": 2.911336469666126e-07, "loss": 0.4132, "step": 15004 }, { "epoch": 2.78, "learning_rate": 2.906553721046757e-07, "loss": 0.4202, "step": 15005 }, { "epoch": 2.78, "learning_rate": 2.9017748462761176e-07, "loss": 0.4087, "step": 15006 }, { "epoch": 2.78, "learning_rate": 2.896999845544901e-07, "loss": 0.4276, "step": 15007 }, { "epoch": 2.78, "learning_rate": 2.8922287190436107e-07, "loss": 0.4162, "step": 15008 }, { "epoch": 2.78, "learning_rate": 2.887461466962593e-07, "loss": 0.4084, "step": 15009 }, { "epoch": 2.78, "learning_rate": 2.8826980894920753e-07, "loss": 0.4275, "step": 15010 }, { "epoch": 2.78, "learning_rate": 2.877938586822082e-07, "loss": 0.4179, "step": 15011 }, { "epoch": 2.78, "learning_rate": 2.8731829591425286e-07, "loss": 0.4175, "step": 15012 }, { "epoch": 2.78, "learning_rate": 2.868431206643163e-07, "loss": 0.4005, "step": 15013 }, { "epoch": 2.78, "learning_rate": 2.8636833295135334e-07, "loss": 0.4147, "step": 15014 }, { "epoch": 2.78, "learning_rate": 2.8589393279431224e-07, "loss": 0.4136, "step": 15015 }, { "epoch": 2.78, "learning_rate": 2.854199202121155e-07, "loss": 0.4213, "step": 15016 }, { "epoch": 2.78, "learning_rate": 2.8494629522367925e-07, "loss": 0.4242, "step": 15017 }, { "epoch": 2.78, "learning_rate": 2.8447305784789933e-07, "loss": 0.4215, "step": 15018 }, { "epoch": 2.78, "learning_rate": 2.8400020810365525e-07, "loss": 0.4038, "step": 15019 }, { "epoch": 2.78, "learning_rate": 2.8352774600981624e-07, "loss": 0.4162, "step": 15020 }, { "epoch": 2.78, "learning_rate": 2.830556715852284e-07, "loss": 0.3942, "step": 15021 }, { "epoch": 2.78, "learning_rate": 2.8258398484872996e-07, "loss": 0.4134, "step": 15022 }, { "epoch": 2.78, "learning_rate": 2.8211268581913806e-07, "loss": 0.4037, "step": 15023 }, { "epoch": 2.78, "learning_rate": 2.816417745152589e-07, "loss": 0.4159, "step": 15024 }, { "epoch": 2.78, "learning_rate": 2.811712509558806e-07, "loss": 0.4004, "step": 15025 }, { "epoch": 2.78, "learning_rate": 2.8070111515977385e-07, "loss": 0.4088, "step": 15026 }, { "epoch": 2.78, "learning_rate": 2.802313671456991e-07, "loss": 0.4111, "step": 15027 }, { "epoch": 2.78, "learning_rate": 2.7976200693239585e-07, "loss": 0.4358, "step": 15028 }, { "epoch": 2.78, "learning_rate": 2.7929303453859247e-07, "loss": 0.4234, "step": 15029 }, { "epoch": 2.78, "learning_rate": 2.788244499829995e-07, "loss": 0.4146, "step": 15030 }, { "epoch": 2.78, "learning_rate": 2.7835625328431315e-07, "loss": 0.4025, "step": 15031 }, { "epoch": 2.78, "learning_rate": 2.7788844446121175e-07, "loss": 0.3981, "step": 15032 }, { "epoch": 2.78, "learning_rate": 2.7742102353236376e-07, "loss": 0.4002, "step": 15033 }, { "epoch": 2.78, "learning_rate": 2.7695399051641425e-07, "loss": 0.4186, "step": 15034 }, { "epoch": 2.78, "learning_rate": 2.764873454319994e-07, "loss": 0.4052, "step": 15035 }, { "epoch": 2.78, "learning_rate": 2.7602108829773656e-07, "loss": 0.3968, "step": 15036 }, { "epoch": 2.78, "learning_rate": 2.755552191322297e-07, "loss": 0.4157, "step": 15037 }, { "epoch": 2.78, "learning_rate": 2.7508973795406404e-07, "loss": 0.4192, "step": 15038 }, { "epoch": 2.78, "learning_rate": 2.746246447818135e-07, "loss": 0.4433, "step": 15039 }, { "epoch": 2.78, "learning_rate": 2.7415993963403445e-07, "loss": 0.401, "step": 15040 }, { "epoch": 2.78, "learning_rate": 2.736956225292653e-07, "loss": 0.3999, "step": 15041 }, { "epoch": 2.78, "learning_rate": 2.732316934860335e-07, "loss": 0.415, "step": 15042 }, { "epoch": 2.78, "learning_rate": 2.727681525228476e-07, "loss": 0.4244, "step": 15043 }, { "epoch": 2.78, "learning_rate": 2.72304999658205e-07, "loss": 0.4155, "step": 15044 }, { "epoch": 2.78, "learning_rate": 2.7184223491058094e-07, "loss": 0.414, "step": 15045 }, { "epoch": 2.78, "learning_rate": 2.713798582984406e-07, "loss": 0.3889, "step": 15046 }, { "epoch": 2.78, "learning_rate": 2.709178698402337e-07, "loss": 0.4244, "step": 15047 }, { "epoch": 2.78, "learning_rate": 2.7045626955438885e-07, "loss": 0.4157, "step": 15048 }, { "epoch": 2.78, "learning_rate": 2.6999505745932577e-07, "loss": 0.4194, "step": 15049 }, { "epoch": 2.78, "learning_rate": 2.695342335734441e-07, "loss": 0.4022, "step": 15050 }, { "epoch": 2.78, "learning_rate": 2.6907379791513257e-07, "loss": 0.4117, "step": 15051 }, { "epoch": 2.78, "learning_rate": 2.686137505027608e-07, "loss": 0.4136, "step": 15052 }, { "epoch": 2.79, "learning_rate": 2.6815409135468096e-07, "loss": 0.4218, "step": 15053 }, { "epoch": 2.79, "learning_rate": 2.676948204892371e-07, "loss": 0.3946, "step": 15054 }, { "epoch": 2.79, "learning_rate": 2.672359379247491e-07, "loss": 0.4092, "step": 15055 }, { "epoch": 2.79, "learning_rate": 2.6677744367952895e-07, "loss": 0.4054, "step": 15056 }, { "epoch": 2.79, "learning_rate": 2.6631933777186756e-07, "loss": 0.4236, "step": 15057 }, { "epoch": 2.79, "learning_rate": 2.6586162022004256e-07, "loss": 0.4396, "step": 15058 }, { "epoch": 2.79, "learning_rate": 2.654042910423171e-07, "loss": 0.4034, "step": 15059 }, { "epoch": 2.79, "learning_rate": 2.649473502569377e-07, "loss": 0.4103, "step": 15060 }, { "epoch": 2.79, "learning_rate": 2.644907978821354e-07, "loss": 0.4162, "step": 15061 }, { "epoch": 2.79, "learning_rate": 2.640346339361244e-07, "loss": 0.4098, "step": 15062 }, { "epoch": 2.79, "learning_rate": 2.635788584371057e-07, "loss": 0.4119, "step": 15063 }, { "epoch": 2.79, "learning_rate": 2.631234714032649e-07, "loss": 0.3878, "step": 15064 }, { "epoch": 2.79, "learning_rate": 2.6266847285276956e-07, "loss": 0.42, "step": 15065 }, { "epoch": 2.79, "learning_rate": 2.6221386280377513e-07, "loss": 0.4309, "step": 15066 }, { "epoch": 2.79, "learning_rate": 2.6175964127441724e-07, "loss": 0.4257, "step": 15067 }, { "epoch": 2.79, "learning_rate": 2.6130580828282016e-07, "loss": 0.4327, "step": 15068 }, { "epoch": 2.79, "learning_rate": 2.6085236384709166e-07, "loss": 0.4116, "step": 15069 }, { "epoch": 2.79, "learning_rate": 2.6039930798532066e-07, "loss": 0.4104, "step": 15070 }, { "epoch": 2.79, "learning_rate": 2.5994664071558596e-07, "loss": 0.3936, "step": 15071 }, { "epoch": 2.79, "learning_rate": 2.5949436205594647e-07, "loss": 0.4401, "step": 15072 }, { "epoch": 2.79, "learning_rate": 2.5904247202444885e-07, "loss": 0.398, "step": 15073 }, { "epoch": 2.79, "learning_rate": 2.58590970639121e-07, "loss": 0.4194, "step": 15074 }, { "epoch": 2.79, "learning_rate": 2.5813985791797727e-07, "loss": 0.4229, "step": 15075 }, { "epoch": 2.79, "learning_rate": 2.576891338790177e-07, "loss": 0.4116, "step": 15076 }, { "epoch": 2.79, "learning_rate": 2.572387985402225e-07, "loss": 0.4374, "step": 15077 }, { "epoch": 2.79, "learning_rate": 2.567888519195627e-07, "loss": 0.4181, "step": 15078 }, { "epoch": 2.79, "learning_rate": 2.5633929403498734e-07, "loss": 0.416, "step": 15079 }, { "epoch": 2.79, "learning_rate": 2.5589012490443544e-07, "loss": 0.4315, "step": 15080 }, { "epoch": 2.79, "learning_rate": 2.5544134454582593e-07, "loss": 0.4019, "step": 15081 }, { "epoch": 2.79, "learning_rate": 2.5499295297706563e-07, "loss": 0.4192, "step": 15082 }, { "epoch": 2.79, "learning_rate": 2.5454495021604355e-07, "loss": 0.4025, "step": 15083 }, { "epoch": 2.79, "learning_rate": 2.5409733628063647e-07, "loss": 0.4266, "step": 15084 }, { "epoch": 2.79, "learning_rate": 2.5365011118869907e-07, "loss": 0.4147, "step": 15085 }, { "epoch": 2.79, "learning_rate": 2.5320327495807927e-07, "loss": 0.424, "step": 15086 }, { "epoch": 2.79, "learning_rate": 2.527568276066017e-07, "loss": 0.4297, "step": 15087 }, { "epoch": 2.79, "learning_rate": 2.5231076915208206e-07, "loss": 0.4047, "step": 15088 }, { "epoch": 2.79, "learning_rate": 2.5186509961231287e-07, "loss": 0.4004, "step": 15089 }, { "epoch": 2.79, "learning_rate": 2.5141981900507986e-07, "loss": 0.4014, "step": 15090 }, { "epoch": 2.79, "learning_rate": 2.5097492734814765e-07, "loss": 0.4281, "step": 15091 }, { "epoch": 2.79, "learning_rate": 2.5053042465926433e-07, "loss": 0.4014, "step": 15092 }, { "epoch": 2.79, "learning_rate": 2.500863109561669e-07, "loss": 0.4051, "step": 15093 }, { "epoch": 2.79, "learning_rate": 2.4964258625657434e-07, "loss": 0.4168, "step": 15094 }, { "epoch": 2.79, "learning_rate": 2.4919925057819037e-07, "loss": 0.4287, "step": 15095 }, { "epoch": 2.79, "learning_rate": 2.487563039387031e-07, "loss": 0.4287, "step": 15096 }, { "epoch": 2.79, "learning_rate": 2.48313746355785e-07, "loss": 0.4234, "step": 15097 }, { "epoch": 2.79, "learning_rate": 2.4787157784709416e-07, "loss": 0.4094, "step": 15098 }, { "epoch": 2.79, "learning_rate": 2.474297984302709e-07, "loss": 0.4197, "step": 15099 }, { "epoch": 2.79, "learning_rate": 2.4698840812294346e-07, "loss": 0.4017, "step": 15100 }, { "epoch": 2.79, "learning_rate": 2.4654740694272206e-07, "loss": 0.418, "step": 15101 }, { "epoch": 2.79, "learning_rate": 2.4610679490719933e-07, "loss": 0.423, "step": 15102 }, { "epoch": 2.79, "learning_rate": 2.456665720339568e-07, "loss": 0.4216, "step": 15103 }, { "epoch": 2.79, "learning_rate": 2.4522673834055823e-07, "loss": 0.3929, "step": 15104 }, { "epoch": 2.79, "learning_rate": 2.4478729384455393e-07, "loss": 0.4355, "step": 15105 }, { "epoch": 2.79, "learning_rate": 2.443482385634743e-07, "loss": 0.4103, "step": 15106 }, { "epoch": 2.8, "learning_rate": 2.439095725148366e-07, "loss": 0.4235, "step": 15107 }, { "epoch": 2.8, "learning_rate": 2.434712957161456e-07, "loss": 0.4342, "step": 15108 }, { "epoch": 2.8, "learning_rate": 2.4303340818488506e-07, "loss": 0.429, "step": 15109 }, { "epoch": 2.8, "learning_rate": 2.4259590993852886e-07, "loss": 0.4089, "step": 15110 }, { "epoch": 2.8, "learning_rate": 2.421588009945286e-07, "loss": 0.4025, "step": 15111 }, { "epoch": 2.8, "learning_rate": 2.4172208137032694e-07, "loss": 0.4083, "step": 15112 }, { "epoch": 2.8, "learning_rate": 2.4128575108334773e-07, "loss": 0.4181, "step": 15113 }, { "epoch": 2.8, "learning_rate": 2.4084981015099817e-07, "loss": 0.4171, "step": 15114 }, { "epoch": 2.8, "learning_rate": 2.4041425859067325e-07, "loss": 0.4217, "step": 15115 }, { "epoch": 2.8, "learning_rate": 2.3997909641974904e-07, "loss": 0.4184, "step": 15116 }, { "epoch": 2.8, "learning_rate": 2.395443236555894e-07, "loss": 0.4248, "step": 15117 }, { "epoch": 2.8, "learning_rate": 2.391099403155406e-07, "loss": 0.3914, "step": 15118 }, { "epoch": 2.8, "learning_rate": 2.3867594641693304e-07, "loss": 0.4087, "step": 15119 }, { "epoch": 2.8, "learning_rate": 2.3824234197708296e-07, "loss": 0.4178, "step": 15120 }, { "epoch": 2.8, "learning_rate": 2.3780912701328872e-07, "loss": 0.4064, "step": 15121 }, { "epoch": 2.8, "learning_rate": 2.3737630154283764e-07, "loss": 0.4017, "step": 15122 }, { "epoch": 2.8, "learning_rate": 2.3694386558299697e-07, "loss": 0.4058, "step": 15123 }, { "epoch": 2.8, "learning_rate": 2.3651181915101962e-07, "loss": 0.4119, "step": 15124 }, { "epoch": 2.8, "learning_rate": 2.360801622641451e-07, "loss": 0.3849, "step": 15125 }, { "epoch": 2.8, "learning_rate": 2.3564889493959298e-07, "loss": 0.4103, "step": 15126 }, { "epoch": 2.8, "learning_rate": 2.3521801719457283e-07, "loss": 0.4126, "step": 15127 }, { "epoch": 2.8, "learning_rate": 2.3478752904627421e-07, "loss": 0.4187, "step": 15128 }, { "epoch": 2.8, "learning_rate": 2.3435743051187343e-07, "loss": 0.4107, "step": 15129 }, { "epoch": 2.8, "learning_rate": 2.3392772160853118e-07, "loss": 0.4284, "step": 15130 }, { "epoch": 2.8, "learning_rate": 2.3349840235339148e-07, "loss": 0.4096, "step": 15131 }, { "epoch": 2.8, "learning_rate": 2.3306947276358183e-07, "loss": 0.4165, "step": 15132 }, { "epoch": 2.8, "learning_rate": 2.326409328562196e-07, "loss": 0.4196, "step": 15133 }, { "epoch": 2.8, "learning_rate": 2.3221278264839776e-07, "loss": 0.4078, "step": 15134 }, { "epoch": 2.8, "learning_rate": 2.3178502215720376e-07, "loss": 0.4072, "step": 15135 }, { "epoch": 2.8, "learning_rate": 2.3135765139969958e-07, "loss": 0.4077, "step": 15136 }, { "epoch": 2.8, "learning_rate": 2.3093067039294148e-07, "loss": 0.4062, "step": 15137 }, { "epoch": 2.8, "learning_rate": 2.3050407915396034e-07, "loss": 0.4029, "step": 15138 }, { "epoch": 2.8, "learning_rate": 2.300778776997803e-07, "loss": 0.4197, "step": 15139 }, { "epoch": 2.8, "learning_rate": 2.296520660474044e-07, "loss": 0.4154, "step": 15140 }, { "epoch": 2.8, "learning_rate": 2.2922664421382134e-07, "loss": 0.4012, "step": 15141 }, { "epoch": 2.8, "learning_rate": 2.2880161221600527e-07, "loss": 0.4089, "step": 15142 }, { "epoch": 2.8, "learning_rate": 2.2837697007091265e-07, "loss": 0.4052, "step": 15143 }, { "epoch": 2.8, "learning_rate": 2.2795271779548878e-07, "loss": 0.4232, "step": 15144 }, { "epoch": 2.8, "learning_rate": 2.2752885540665904e-07, "loss": 0.4205, "step": 15145 }, { "epoch": 2.8, "learning_rate": 2.2710538292133434e-07, "loss": 0.4098, "step": 15146 }, { "epoch": 2.8, "learning_rate": 2.2668230035641116e-07, "loss": 0.4267, "step": 15147 }, { "epoch": 2.8, "learning_rate": 2.2625960772876821e-07, "loss": 0.4184, "step": 15148 }, { "epoch": 2.8, "learning_rate": 2.25837305055272e-07, "loss": 0.4259, "step": 15149 }, { "epoch": 2.8, "learning_rate": 2.2541539235277133e-07, "loss": 0.403, "step": 15150 }, { "epoch": 2.8, "learning_rate": 2.2499386963809934e-07, "loss": 0.4206, "step": 15151 }, { "epoch": 2.8, "learning_rate": 2.2457273692807368e-07, "loss": 0.429, "step": 15152 }, { "epoch": 2.8, "learning_rate": 2.2415199423949651e-07, "loss": 0.4132, "step": 15153 }, { "epoch": 2.8, "learning_rate": 2.237316415891566e-07, "loss": 0.4213, "step": 15154 }, { "epoch": 2.8, "learning_rate": 2.2331167899382278e-07, "loss": 0.4237, "step": 15155 }, { "epoch": 2.8, "learning_rate": 2.2289210647025273e-07, "loss": 0.4351, "step": 15156 }, { "epoch": 2.8, "learning_rate": 2.2247292403518527e-07, "loss": 0.4254, "step": 15157 }, { "epoch": 2.8, "learning_rate": 2.2205413170534483e-07, "loss": 0.4072, "step": 15158 }, { "epoch": 2.8, "learning_rate": 2.216357294974425e-07, "loss": 0.4093, "step": 15159 }, { "epoch": 2.8, "learning_rate": 2.2121771742816933e-07, "loss": 0.403, "step": 15160 }, { "epoch": 2.8, "learning_rate": 2.2080009551420535e-07, "loss": 0.4181, "step": 15161 }, { "epoch": 2.81, "learning_rate": 2.2038286377221164e-07, "loss": 0.3916, "step": 15162 }, { "epoch": 2.81, "learning_rate": 2.199660222188349e-07, "loss": 0.4294, "step": 15163 }, { "epoch": 2.81, "learning_rate": 2.1954957087070628e-07, "loss": 0.4171, "step": 15164 }, { "epoch": 2.81, "learning_rate": 2.1913350974444246e-07, "loss": 0.4056, "step": 15165 }, { "epoch": 2.81, "learning_rate": 2.1871783885664244e-07, "loss": 0.4271, "step": 15166 }, { "epoch": 2.81, "learning_rate": 2.183025582238918e-07, "loss": 0.4087, "step": 15167 }, { "epoch": 2.81, "learning_rate": 2.1788766786275728e-07, "loss": 0.4086, "step": 15168 }, { "epoch": 2.81, "learning_rate": 2.1747316778979454e-07, "loss": 0.4072, "step": 15169 }, { "epoch": 2.81, "learning_rate": 2.1705905802154038e-07, "loss": 0.41, "step": 15170 }, { "epoch": 2.81, "learning_rate": 2.166453385745171e-07, "loss": 0.4126, "step": 15171 }, { "epoch": 2.81, "learning_rate": 2.162320094652326e-07, "loss": 0.4191, "step": 15172 }, { "epoch": 2.81, "learning_rate": 2.1581907071017481e-07, "loss": 0.432, "step": 15173 }, { "epoch": 2.81, "learning_rate": 2.1540652232582282e-07, "loss": 0.4338, "step": 15174 }, { "epoch": 2.81, "learning_rate": 2.149943643286334e-07, "loss": 0.4081, "step": 15175 }, { "epoch": 2.81, "learning_rate": 2.1458259673505344e-07, "loss": 0.4222, "step": 15176 }, { "epoch": 2.81, "learning_rate": 2.1417121956150978e-07, "loss": 0.3996, "step": 15177 }, { "epoch": 2.81, "learning_rate": 2.1376023282441814e-07, "loss": 0.4196, "step": 15178 }, { "epoch": 2.81, "learning_rate": 2.1334963654017215e-07, "loss": 0.4109, "step": 15179 }, { "epoch": 2.81, "learning_rate": 2.1293943072515867e-07, "loss": 0.3997, "step": 15180 }, { "epoch": 2.81, "learning_rate": 2.1252961539573902e-07, "loss": 0.3934, "step": 15181 }, { "epoch": 2.81, "learning_rate": 2.1212019056826905e-07, "loss": 0.4161, "step": 15182 }, { "epoch": 2.81, "learning_rate": 2.117111562590801e-07, "loss": 0.388, "step": 15183 }, { "epoch": 2.81, "learning_rate": 2.1130251248449475e-07, "loss": 0.4169, "step": 15184 }, { "epoch": 2.81, "learning_rate": 2.108942592608143e-07, "loss": 0.4102, "step": 15185 }, { "epoch": 2.81, "learning_rate": 2.1048639660433024e-07, "loss": 0.4088, "step": 15186 }, { "epoch": 2.81, "learning_rate": 2.1007892453131285e-07, "loss": 0.3961, "step": 15187 }, { "epoch": 2.81, "learning_rate": 2.0967184305802246e-07, "loss": 0.4151, "step": 15188 }, { "epoch": 2.81, "learning_rate": 2.0926515220069833e-07, "loss": 0.4098, "step": 15189 }, { "epoch": 2.81, "learning_rate": 2.0885885197556744e-07, "loss": 0.4061, "step": 15190 }, { "epoch": 2.81, "learning_rate": 2.084529423988413e-07, "loss": 0.4166, "step": 15191 }, { "epoch": 2.81, "learning_rate": 2.0804742348671358e-07, "loss": 0.39, "step": 15192 }, { "epoch": 2.81, "learning_rate": 2.0764229525536472e-07, "loss": 0.4172, "step": 15193 }, { "epoch": 2.81, "learning_rate": 2.0723755772095845e-07, "loss": 0.4143, "step": 15194 }, { "epoch": 2.81, "learning_rate": 2.068332108996407e-07, "loss": 0.411, "step": 15195 }, { "epoch": 2.81, "learning_rate": 2.064292548075486e-07, "loss": 0.41, "step": 15196 }, { "epoch": 2.81, "learning_rate": 2.0602568946079593e-07, "loss": 0.4178, "step": 15197 }, { "epoch": 2.81, "learning_rate": 2.0562251487548534e-07, "loss": 0.414, "step": 15198 }, { "epoch": 2.81, "learning_rate": 2.0521973106770288e-07, "loss": 0.4042, "step": 15199 }, { "epoch": 2.81, "learning_rate": 2.0481733805351788e-07, "loss": 0.4287, "step": 15200 }, { "epoch": 2.81, "learning_rate": 2.0441533584898755e-07, "loss": 0.4186, "step": 15201 }, { "epoch": 2.81, "learning_rate": 2.0401372447014677e-07, "loss": 0.4527, "step": 15202 }, { "epoch": 2.81, "learning_rate": 2.036125039330239e-07, "loss": 0.4118, "step": 15203 }, { "epoch": 2.81, "learning_rate": 2.0321167425362275e-07, "loss": 0.418, "step": 15204 }, { "epoch": 2.81, "learning_rate": 2.0281123544793835e-07, "loss": 0.4243, "step": 15205 }, { "epoch": 2.81, "learning_rate": 2.0241118753194788e-07, "loss": 0.3945, "step": 15206 }, { "epoch": 2.81, "learning_rate": 2.020115305216086e-07, "loss": 0.4039, "step": 15207 }, { "epoch": 2.81, "learning_rate": 2.0161226443287108e-07, "loss": 0.428, "step": 15208 }, { "epoch": 2.81, "learning_rate": 2.0121338928166146e-07, "loss": 0.3988, "step": 15209 }, { "epoch": 2.81, "learning_rate": 2.0081490508389701e-07, "loss": 0.4234, "step": 15210 }, { "epoch": 2.81, "learning_rate": 2.004168118554739e-07, "loss": 0.4025, "step": 15211 }, { "epoch": 2.81, "learning_rate": 2.0001910961227722e-07, "loss": 0.416, "step": 15212 }, { "epoch": 2.81, "learning_rate": 1.9962179837017425e-07, "loss": 0.4039, "step": 15213 }, { "epoch": 2.81, "learning_rate": 1.9922487814501569e-07, "loss": 0.431, "step": 15214 }, { "epoch": 2.81, "learning_rate": 1.988283489526388e-07, "loss": 0.4227, "step": 15215 }, { "epoch": 2.82, "learning_rate": 1.9843221080886544e-07, "loss": 0.4074, "step": 15216 }, { "epoch": 2.82, "learning_rate": 1.9803646372949847e-07, "loss": 0.4088, "step": 15217 }, { "epoch": 2.82, "learning_rate": 1.9764110773032973e-07, "loss": 0.4155, "step": 15218 }, { "epoch": 2.82, "learning_rate": 1.9724614282713218e-07, "loss": 0.4295, "step": 15219 }, { "epoch": 2.82, "learning_rate": 1.9685156903566426e-07, "loss": 0.4097, "step": 15220 }, { "epoch": 2.82, "learning_rate": 1.9645738637166678e-07, "loss": 0.4077, "step": 15221 }, { "epoch": 2.82, "learning_rate": 1.9606359485087155e-07, "loss": 0.445, "step": 15222 }, { "epoch": 2.82, "learning_rate": 1.9567019448898605e-07, "loss": 0.4136, "step": 15223 }, { "epoch": 2.82, "learning_rate": 1.952771853017077e-07, "loss": 0.4152, "step": 15224 }, { "epoch": 2.82, "learning_rate": 1.9488456730471728e-07, "loss": 0.41, "step": 15225 }, { "epoch": 2.82, "learning_rate": 1.9449234051367782e-07, "loss": 0.432, "step": 15226 }, { "epoch": 2.82, "learning_rate": 1.9410050494424014e-07, "loss": 0.4076, "step": 15227 }, { "epoch": 2.82, "learning_rate": 1.9370906061203732e-07, "loss": 0.4144, "step": 15228 }, { "epoch": 2.82, "learning_rate": 1.933180075326868e-07, "loss": 0.4091, "step": 15229 }, { "epoch": 2.82, "learning_rate": 1.929273457217917e-07, "loss": 0.4111, "step": 15230 }, { "epoch": 2.82, "learning_rate": 1.9253707519493736e-07, "loss": 0.3971, "step": 15231 }, { "epoch": 2.82, "learning_rate": 1.921471959676957e-07, "loss": 0.4075, "step": 15232 }, { "epoch": 2.82, "learning_rate": 1.917577080556221e-07, "loss": 0.4108, "step": 15233 }, { "epoch": 2.82, "learning_rate": 1.9136861147425744e-07, "loss": 0.4235, "step": 15234 }, { "epoch": 2.82, "learning_rate": 1.9097990623912488e-07, "loss": 0.4009, "step": 15235 }, { "epoch": 2.82, "learning_rate": 1.9059159236573198e-07, "loss": 0.418, "step": 15236 }, { "epoch": 2.82, "learning_rate": 1.9020366986957418e-07, "loss": 0.4194, "step": 15237 }, { "epoch": 2.82, "learning_rate": 1.898161387661268e-07, "loss": 0.4137, "step": 15238 }, { "epoch": 2.82, "learning_rate": 1.894289990708531e-07, "loss": 0.4089, "step": 15239 }, { "epoch": 2.82, "learning_rate": 1.8904225079919847e-07, "loss": 0.4239, "step": 15240 }, { "epoch": 2.82, "learning_rate": 1.886558939665928e-07, "loss": 0.4261, "step": 15241 }, { "epoch": 2.82, "learning_rate": 1.8826992858845262e-07, "loss": 0.4147, "step": 15242 }, { "epoch": 2.82, "learning_rate": 1.8788435468017564e-07, "loss": 0.4168, "step": 15243 }, { "epoch": 2.82, "learning_rate": 1.874991722571462e-07, "loss": 0.4035, "step": 15244 }, { "epoch": 2.82, "learning_rate": 1.8711438133473315e-07, "loss": 0.4205, "step": 15245 }, { "epoch": 2.82, "learning_rate": 1.867299819282875e-07, "loss": 0.4236, "step": 15246 }, { "epoch": 2.82, "learning_rate": 1.8634597405314703e-07, "loss": 0.4122, "step": 15247 }, { "epoch": 2.82, "learning_rate": 1.8596235772463277e-07, "loss": 0.4241, "step": 15248 }, { "epoch": 2.82, "learning_rate": 1.855791329580503e-07, "loss": 0.4272, "step": 15249 }, { "epoch": 2.82, "learning_rate": 1.8519629976868959e-07, "loss": 0.4027, "step": 15250 }, { "epoch": 2.82, "learning_rate": 1.8481385817182507e-07, "loss": 0.3923, "step": 15251 }, { "epoch": 2.82, "learning_rate": 1.8443180818271455e-07, "loss": 0.4124, "step": 15252 }, { "epoch": 2.82, "learning_rate": 1.8405014981660252e-07, "loss": 0.4267, "step": 15253 }, { "epoch": 2.82, "learning_rate": 1.8366888308871566e-07, "loss": 0.4182, "step": 15254 }, { "epoch": 2.82, "learning_rate": 1.8328800801426628e-07, "loss": 0.4181, "step": 15255 }, { "epoch": 2.82, "learning_rate": 1.8290752460844884e-07, "loss": 0.4109, "step": 15256 }, { "epoch": 2.82, "learning_rate": 1.825274328864468e-07, "loss": 0.4008, "step": 15257 }, { "epoch": 2.82, "learning_rate": 1.8214773286342246e-07, "loss": 0.4026, "step": 15258 }, { "epoch": 2.82, "learning_rate": 1.8176842455452703e-07, "loss": 0.411, "step": 15259 }, { "epoch": 2.82, "learning_rate": 1.8138950797489397e-07, "loss": 0.4044, "step": 15260 }, { "epoch": 2.82, "learning_rate": 1.8101098313964005e-07, "loss": 0.417, "step": 15261 }, { "epoch": 2.82, "learning_rate": 1.8063285006386876e-07, "loss": 0.4103, "step": 15262 }, { "epoch": 2.82, "learning_rate": 1.8025510876266584e-07, "loss": 0.4154, "step": 15263 }, { "epoch": 2.82, "learning_rate": 1.7987775925110473e-07, "loss": 0.3979, "step": 15264 }, { "epoch": 2.82, "learning_rate": 1.7950080154423898e-07, "loss": 0.3972, "step": 15265 }, { "epoch": 2.82, "learning_rate": 1.791242356571088e-07, "loss": 0.4184, "step": 15266 }, { "epoch": 2.82, "learning_rate": 1.787480616047388e-07, "loss": 0.4076, "step": 15267 }, { "epoch": 2.82, "learning_rate": 1.7837227940213698e-07, "loss": 0.4215, "step": 15268 }, { "epoch": 2.82, "learning_rate": 1.7799688906429803e-07, "loss": 0.4061, "step": 15269 }, { "epoch": 2.83, "learning_rate": 1.776218906061977e-07, "loss": 0.4192, "step": 15270 }, { "epoch": 2.83, "learning_rate": 1.7724728404279856e-07, "loss": 0.4038, "step": 15271 }, { "epoch": 2.83, "learning_rate": 1.7687306938904746e-07, "loss": 0.4311, "step": 15272 }, { "epoch": 2.83, "learning_rate": 1.764992466598725e-07, "loss": 0.402, "step": 15273 }, { "epoch": 2.83, "learning_rate": 1.7612581587018952e-07, "loss": 0.3929, "step": 15274 }, { "epoch": 2.83, "learning_rate": 1.757527770348988e-07, "loss": 0.4092, "step": 15275 }, { "epoch": 2.83, "learning_rate": 1.7538013016888288e-07, "loss": 0.4105, "step": 15276 }, { "epoch": 2.83, "learning_rate": 1.7500787528701102e-07, "loss": 0.4077, "step": 15277 }, { "epoch": 2.83, "learning_rate": 1.7463601240413352e-07, "loss": 0.4263, "step": 15278 }, { "epoch": 2.83, "learning_rate": 1.7426454153508742e-07, "loss": 0.415, "step": 15279 }, { "epoch": 2.83, "learning_rate": 1.738934626946942e-07, "loss": 0.4162, "step": 15280 }, { "epoch": 2.83, "learning_rate": 1.735227758977609e-07, "loss": 0.4173, "step": 15281 }, { "epoch": 2.83, "learning_rate": 1.7315248115907457e-07, "loss": 0.3981, "step": 15282 }, { "epoch": 2.83, "learning_rate": 1.7278257849341006e-07, "loss": 0.4137, "step": 15283 }, { "epoch": 2.83, "learning_rate": 1.724130679155256e-07, "loss": 0.4022, "step": 15284 }, { "epoch": 2.83, "learning_rate": 1.72043949440166e-07, "loss": 0.4422, "step": 15285 }, { "epoch": 2.83, "learning_rate": 1.716752230820551e-07, "loss": 0.4319, "step": 15286 }, { "epoch": 2.83, "learning_rate": 1.7130688885590774e-07, "loss": 0.4112, "step": 15287 }, { "epoch": 2.83, "learning_rate": 1.7093894677641664e-07, "loss": 0.429, "step": 15288 }, { "epoch": 2.83, "learning_rate": 1.7057139685826562e-07, "loss": 0.3823, "step": 15289 }, { "epoch": 2.83, "learning_rate": 1.7020423911611517e-07, "loss": 0.4231, "step": 15290 }, { "epoch": 2.83, "learning_rate": 1.6983747356461687e-07, "loss": 0.4128, "step": 15291 }, { "epoch": 2.83, "learning_rate": 1.6947110021840352e-07, "loss": 0.4145, "step": 15292 }, { "epoch": 2.83, "learning_rate": 1.6910511909209227e-07, "loss": 0.4172, "step": 15293 }, { "epoch": 2.83, "learning_rate": 1.687395302002859e-07, "loss": 0.4149, "step": 15294 }, { "epoch": 2.83, "learning_rate": 1.6837433355756938e-07, "loss": 0.3993, "step": 15295 }, { "epoch": 2.83, "learning_rate": 1.6800952917851555e-07, "loss": 0.414, "step": 15296 }, { "epoch": 2.83, "learning_rate": 1.6764511707767606e-07, "loss": 0.4314, "step": 15297 }, { "epoch": 2.83, "learning_rate": 1.6728109726959373e-07, "loss": 0.3982, "step": 15298 }, { "epoch": 2.83, "learning_rate": 1.669174697687903e-07, "loss": 0.4094, "step": 15299 }, { "epoch": 2.83, "learning_rate": 1.6655423458977416e-07, "loss": 0.4015, "step": 15300 }, { "epoch": 2.83, "learning_rate": 1.6619139174703925e-07, "loss": 0.4005, "step": 15301 }, { "epoch": 2.83, "learning_rate": 1.6582894125505956e-07, "loss": 0.4077, "step": 15302 }, { "epoch": 2.83, "learning_rate": 1.6546688312829794e-07, "loss": 0.4118, "step": 15303 }, { "epoch": 2.83, "learning_rate": 1.6510521738119957e-07, "loss": 0.414, "step": 15304 }, { "epoch": 2.83, "learning_rate": 1.6474394402819393e-07, "loss": 0.4285, "step": 15305 }, { "epoch": 2.83, "learning_rate": 1.643830630836962e-07, "loss": 0.4171, "step": 15306 }, { "epoch": 2.83, "learning_rate": 1.640225745621038e-07, "loss": 0.4058, "step": 15307 }, { "epoch": 2.83, "learning_rate": 1.636624784777996e-07, "loss": 0.4126, "step": 15308 }, { "epoch": 2.83, "learning_rate": 1.633027748451521e-07, "loss": 0.4062, "step": 15309 }, { "epoch": 2.83, "learning_rate": 1.6294346367850988e-07, "loss": 0.3893, "step": 15310 }, { "epoch": 2.83, "learning_rate": 1.6258454499221144e-07, "loss": 0.4234, "step": 15311 }, { "epoch": 2.83, "learning_rate": 1.6222601880057642e-07, "loss": 0.4025, "step": 15312 }, { "epoch": 2.83, "learning_rate": 1.6186788511790896e-07, "loss": 0.4067, "step": 15313 }, { "epoch": 2.83, "learning_rate": 1.6151014395849762e-07, "loss": 0.4028, "step": 15314 }, { "epoch": 2.83, "learning_rate": 1.6115279533661654e-07, "loss": 0.401, "step": 15315 }, { "epoch": 2.83, "learning_rate": 1.607958392665232e-07, "loss": 0.3872, "step": 15316 }, { "epoch": 2.83, "learning_rate": 1.6043927576245844e-07, "loss": 0.4266, "step": 15317 }, { "epoch": 2.83, "learning_rate": 1.6008310483864975e-07, "loss": 0.4128, "step": 15318 }, { "epoch": 2.83, "learning_rate": 1.5972732650930577e-07, "loss": 0.4213, "step": 15319 }, { "epoch": 2.83, "learning_rate": 1.5937194078862407e-07, "loss": 0.4114, "step": 15320 }, { "epoch": 2.83, "learning_rate": 1.5901694769078212e-07, "loss": 0.4033, "step": 15321 }, { "epoch": 2.83, "learning_rate": 1.5866234722994312e-07, "loss": 0.4156, "step": 15322 }, { "epoch": 2.83, "learning_rate": 1.583081394202568e-07, "loss": 0.4123, "step": 15323 }, { "epoch": 2.84, "learning_rate": 1.57954324275853e-07, "loss": 0.4224, "step": 15324 }, { "epoch": 2.84, "learning_rate": 1.5760090181085042e-07, "loss": 0.3986, "step": 15325 }, { "epoch": 2.84, "learning_rate": 1.5724787203935e-07, "loss": 0.4229, "step": 15326 }, { "epoch": 2.84, "learning_rate": 1.5689523497543491e-07, "loss": 0.409, "step": 15327 }, { "epoch": 2.84, "learning_rate": 1.5654299063317612e-07, "loss": 0.4177, "step": 15328 }, { "epoch": 2.84, "learning_rate": 1.5619113902662685e-07, "loss": 0.4135, "step": 15329 }, { "epoch": 2.84, "learning_rate": 1.5583968016982698e-07, "loss": 0.4112, "step": 15330 }, { "epoch": 2.84, "learning_rate": 1.5548861407679637e-07, "loss": 0.4078, "step": 15331 }, { "epoch": 2.84, "learning_rate": 1.5513794076154497e-07, "loss": 0.3997, "step": 15332 }, { "epoch": 2.84, "learning_rate": 1.5478766023806158e-07, "loss": 0.43, "step": 15333 }, { "epoch": 2.84, "learning_rate": 1.5443777252032277e-07, "loss": 0.4107, "step": 15334 }, { "epoch": 2.84, "learning_rate": 1.540882776222874e-07, "loss": 0.4026, "step": 15335 }, { "epoch": 2.84, "learning_rate": 1.5373917555790209e-07, "loss": 0.422, "step": 15336 }, { "epoch": 2.84, "learning_rate": 1.5339046634109344e-07, "loss": 0.403, "step": 15337 }, { "epoch": 2.84, "learning_rate": 1.530421499857748e-07, "loss": 0.4295, "step": 15338 }, { "epoch": 2.84, "learning_rate": 1.5269422650584175e-07, "loss": 0.4164, "step": 15339 }, { "epoch": 2.84, "learning_rate": 1.523466959151787e-07, "loss": 0.4057, "step": 15340 }, { "epoch": 2.84, "learning_rate": 1.51999558227649e-07, "loss": 0.4206, "step": 15341 }, { "epoch": 2.84, "learning_rate": 1.5165281345710493e-07, "loss": 0.4095, "step": 15342 }, { "epoch": 2.84, "learning_rate": 1.5130646161737984e-07, "loss": 0.4164, "step": 15343 }, { "epoch": 2.84, "learning_rate": 1.5096050272229267e-07, "loss": 0.39, "step": 15344 }, { "epoch": 2.84, "learning_rate": 1.5061493678564575e-07, "loss": 0.4104, "step": 15345 }, { "epoch": 2.84, "learning_rate": 1.5026976382122695e-07, "loss": 0.4061, "step": 15346 }, { "epoch": 2.84, "learning_rate": 1.4992498384280962e-07, "loss": 0.4054, "step": 15347 }, { "epoch": 2.84, "learning_rate": 1.4958059686414729e-07, "loss": 0.4301, "step": 15348 }, { "epoch": 2.84, "learning_rate": 1.4923660289898223e-07, "loss": 0.4127, "step": 15349 }, { "epoch": 2.84, "learning_rate": 1.4889300196103796e-07, "loss": 0.4133, "step": 15350 }, { "epoch": 2.84, "learning_rate": 1.4854979406402347e-07, "loss": 0.4105, "step": 15351 }, { "epoch": 2.84, "learning_rate": 1.482069792216345e-07, "loss": 0.4159, "step": 15352 }, { "epoch": 2.84, "learning_rate": 1.4786455744754568e-07, "loss": 0.4278, "step": 15353 }, { "epoch": 2.84, "learning_rate": 1.475225287554205e-07, "loss": 0.4035, "step": 15354 }, { "epoch": 2.84, "learning_rate": 1.4718089315890582e-07, "loss": 0.4162, "step": 15355 }, { "epoch": 2.84, "learning_rate": 1.4683965067163075e-07, "loss": 0.4291, "step": 15356 }, { "epoch": 2.84, "learning_rate": 1.4649880130721105e-07, "loss": 0.4159, "step": 15357 }, { "epoch": 2.84, "learning_rate": 1.4615834507924587e-07, "loss": 0.4322, "step": 15358 }, { "epoch": 2.84, "learning_rate": 1.4581828200131876e-07, "loss": 0.4335, "step": 15359 }, { "epoch": 2.84, "learning_rate": 1.4547861208699777e-07, "loss": 0.4227, "step": 15360 }, { "epoch": 2.84, "learning_rate": 1.4513933534983536e-07, "loss": 0.401, "step": 15361 }, { "epoch": 2.84, "learning_rate": 1.4480045180336744e-07, "loss": 0.4206, "step": 15362 }, { "epoch": 2.84, "learning_rate": 1.4446196146111423e-07, "loss": 0.4128, "step": 15363 }, { "epoch": 2.84, "learning_rate": 1.4412386433658277e-07, "loss": 0.415, "step": 15364 }, { "epoch": 2.84, "learning_rate": 1.4378616044326112e-07, "loss": 0.4199, "step": 15365 }, { "epoch": 2.84, "learning_rate": 1.4344884979462293e-07, "loss": 0.4204, "step": 15366 }, { "epoch": 2.84, "learning_rate": 1.4311193240412748e-07, "loss": 0.4004, "step": 15367 }, { "epoch": 2.84, "learning_rate": 1.427754082852162e-07, "loss": 0.4082, "step": 15368 }, { "epoch": 2.84, "learning_rate": 1.4243927745131614e-07, "loss": 0.4107, "step": 15369 }, { "epoch": 2.84, "learning_rate": 1.421035399158377e-07, "loss": 0.4255, "step": 15370 }, { "epoch": 2.84, "learning_rate": 1.4176819569217682e-07, "loss": 0.3878, "step": 15371 }, { "epoch": 2.84, "learning_rate": 1.4143324479371278e-07, "loss": 0.4204, "step": 15372 }, { "epoch": 2.84, "learning_rate": 1.4109868723380938e-07, "loss": 0.423, "step": 15373 }, { "epoch": 2.84, "learning_rate": 1.407645230258159e-07, "loss": 0.4305, "step": 15374 }, { "epoch": 2.84, "learning_rate": 1.404307521830639e-07, "loss": 0.4379, "step": 15375 }, { "epoch": 2.84, "learning_rate": 1.4009737471886942e-07, "loss": 0.4127, "step": 15376 }, { "epoch": 2.84, "learning_rate": 1.3976439064653513e-07, "loss": 0.3963, "step": 15377 }, { "epoch": 2.85, "learning_rate": 1.3943179997934597e-07, "loss": 0.4114, "step": 15378 }, { "epoch": 2.85, "learning_rate": 1.3909960273057132e-07, "loss": 0.4402, "step": 15379 }, { "epoch": 2.85, "learning_rate": 1.3876779891346614e-07, "loss": 0.401, "step": 15380 }, { "epoch": 2.85, "learning_rate": 1.3843638854126762e-07, "loss": 0.4175, "step": 15381 }, { "epoch": 2.85, "learning_rate": 1.381053716271996e-07, "loss": 0.4069, "step": 15382 }, { "epoch": 2.85, "learning_rate": 1.3777474818446823e-07, "loss": 0.4159, "step": 15383 }, { "epoch": 2.85, "learning_rate": 1.3744451822626404e-07, "loss": 0.3936, "step": 15384 }, { "epoch": 2.85, "learning_rate": 1.3711468176576538e-07, "loss": 0.4137, "step": 15385 }, { "epoch": 2.85, "learning_rate": 1.3678523881612837e-07, "loss": 0.3884, "step": 15386 }, { "epoch": 2.85, "learning_rate": 1.364561893905003e-07, "loss": 0.4135, "step": 15387 }, { "epoch": 2.85, "learning_rate": 1.3612753350200735e-07, "loss": 0.4173, "step": 15388 }, { "epoch": 2.85, "learning_rate": 1.3579927116376457e-07, "loss": 0.4111, "step": 15389 }, { "epoch": 2.85, "learning_rate": 1.3547140238886701e-07, "loss": 0.3939, "step": 15390 }, { "epoch": 2.85, "learning_rate": 1.3514392719039758e-07, "loss": 0.4217, "step": 15391 }, { "epoch": 2.85, "learning_rate": 1.3481684558142028e-07, "loss": 0.4237, "step": 15392 }, { "epoch": 2.85, "learning_rate": 1.3449015757498684e-07, "loss": 0.4204, "step": 15393 }, { "epoch": 2.85, "learning_rate": 1.341638631841302e-07, "loss": 0.4248, "step": 15394 }, { "epoch": 2.85, "learning_rate": 1.3383796242186887e-07, "loss": 0.3968, "step": 15395 }, { "epoch": 2.85, "learning_rate": 1.3351245530120682e-07, "loss": 0.4146, "step": 15396 }, { "epoch": 2.85, "learning_rate": 1.3318734183513037e-07, "loss": 0.4291, "step": 15397 }, { "epoch": 2.85, "learning_rate": 1.3286262203661027e-07, "loss": 0.4012, "step": 15398 }, { "epoch": 2.85, "learning_rate": 1.325382959186039e-07, "loss": 0.4048, "step": 15399 }, { "epoch": 2.85, "learning_rate": 1.3221436349404982e-07, "loss": 0.4287, "step": 15400 }, { "epoch": 2.85, "learning_rate": 1.3189082477587323e-07, "loss": 0.3912, "step": 15401 }, { "epoch": 2.85, "learning_rate": 1.315676797769816e-07, "loss": 0.4042, "step": 15402 }, { "epoch": 2.85, "learning_rate": 1.3124492851027016e-07, "loss": 0.4157, "step": 15403 }, { "epoch": 2.85, "learning_rate": 1.3092257098861415e-07, "loss": 0.4037, "step": 15404 }, { "epoch": 2.85, "learning_rate": 1.3060060722487443e-07, "loss": 0.4126, "step": 15405 }, { "epoch": 2.85, "learning_rate": 1.302790372318985e-07, "loss": 0.4032, "step": 15406 }, { "epoch": 2.85, "learning_rate": 1.2995786102251496e-07, "loss": 0.4009, "step": 15407 }, { "epoch": 2.85, "learning_rate": 1.296370786095402e-07, "loss": 0.4132, "step": 15408 }, { "epoch": 2.85, "learning_rate": 1.2931669000577185e-07, "loss": 0.3955, "step": 15409 }, { "epoch": 2.85, "learning_rate": 1.2899669522399072e-07, "loss": 0.417, "step": 15410 }, { "epoch": 2.85, "learning_rate": 1.2867709427696662e-07, "loss": 0.4176, "step": 15411 }, { "epoch": 2.85, "learning_rate": 1.2835788717744936e-07, "loss": 0.417, "step": 15412 }, { "epoch": 2.85, "learning_rate": 1.280390739381765e-07, "loss": 0.4131, "step": 15413 }, { "epoch": 2.85, "learning_rate": 1.277206545718679e-07, "loss": 0.4261, "step": 15414 }, { "epoch": 2.85, "learning_rate": 1.2740262909122558e-07, "loss": 0.3954, "step": 15415 }, { "epoch": 2.85, "learning_rate": 1.2708499750894053e-07, "loss": 0.419, "step": 15416 }, { "epoch": 2.85, "learning_rate": 1.2676775983768487e-07, "loss": 0.4092, "step": 15417 }, { "epoch": 2.85, "learning_rate": 1.2645091609011505e-07, "loss": 0.406, "step": 15418 }, { "epoch": 2.85, "learning_rate": 1.2613446627887438e-07, "loss": 0.4106, "step": 15419 }, { "epoch": 2.85, "learning_rate": 1.2581841041658716e-07, "loss": 0.3894, "step": 15420 }, { "epoch": 2.85, "learning_rate": 1.255027485158633e-07, "loss": 0.4083, "step": 15421 }, { "epoch": 2.85, "learning_rate": 1.251874805892972e-07, "loss": 0.4104, "step": 15422 }, { "epoch": 2.85, "learning_rate": 1.2487260664946988e-07, "loss": 0.4053, "step": 15423 }, { "epoch": 2.85, "learning_rate": 1.245581267089402e-07, "loss": 0.4112, "step": 15424 }, { "epoch": 2.85, "learning_rate": 1.2424404078025808e-07, "loss": 0.4114, "step": 15425 }, { "epoch": 2.85, "learning_rate": 1.2393034887595467e-07, "loss": 0.4249, "step": 15426 }, { "epoch": 2.85, "learning_rate": 1.2361705100854438e-07, "loss": 0.4085, "step": 15427 }, { "epoch": 2.85, "learning_rate": 1.233041471905294e-07, "loss": 0.4165, "step": 15428 }, { "epoch": 2.85, "learning_rate": 1.22991637434392e-07, "loss": 0.4061, "step": 15429 }, { "epoch": 2.85, "learning_rate": 1.2267952175260113e-07, "loss": 0.4076, "step": 15430 }, { "epoch": 2.85, "learning_rate": 1.2236780015761008e-07, "loss": 0.4256, "step": 15431 }, { "epoch": 2.86, "learning_rate": 1.220564726618567e-07, "loss": 0.4082, "step": 15432 }, { "epoch": 2.86, "learning_rate": 1.2174553927776e-07, "loss": 0.4207, "step": 15433 }, { "epoch": 2.86, "learning_rate": 1.214350000177289e-07, "loss": 0.4099, "step": 15434 }, { "epoch": 2.86, "learning_rate": 1.2112485489415015e-07, "loss": 0.4066, "step": 15435 }, { "epoch": 2.86, "learning_rate": 1.2081510391940055e-07, "loss": 0.3938, "step": 15436 }, { "epoch": 2.86, "learning_rate": 1.2050574710583684e-07, "loss": 0.4011, "step": 15437 }, { "epoch": 2.86, "learning_rate": 1.2019678446580363e-07, "loss": 0.4072, "step": 15438 }, { "epoch": 2.86, "learning_rate": 1.1988821601162437e-07, "loss": 0.4162, "step": 15439 }, { "epoch": 2.86, "learning_rate": 1.1958004175561478e-07, "loss": 0.4133, "step": 15440 }, { "epoch": 2.86, "learning_rate": 1.1927226171006833e-07, "loss": 0.4246, "step": 15441 }, { "epoch": 2.86, "learning_rate": 1.1896487588726413e-07, "loss": 0.4044, "step": 15442 }, { "epoch": 2.86, "learning_rate": 1.186578842994679e-07, "loss": 0.4156, "step": 15443 }, { "epoch": 2.86, "learning_rate": 1.183512869589265e-07, "loss": 0.416, "step": 15444 }, { "epoch": 2.86, "learning_rate": 1.180450838778735e-07, "loss": 0.4215, "step": 15445 }, { "epoch": 2.86, "learning_rate": 1.1773927506852578e-07, "loss": 0.4402, "step": 15446 }, { "epoch": 2.86, "learning_rate": 1.174338605430847e-07, "loss": 0.4222, "step": 15447 }, { "epoch": 2.86, "learning_rate": 1.1712884031373606e-07, "loss": 0.4317, "step": 15448 }, { "epoch": 2.86, "learning_rate": 1.168242143926479e-07, "loss": 0.4263, "step": 15449 }, { "epoch": 2.86, "learning_rate": 1.1651998279197607e-07, "loss": 0.4299, "step": 15450 }, { "epoch": 2.86, "learning_rate": 1.1621614552385752e-07, "loss": 0.4201, "step": 15451 }, { "epoch": 2.86, "learning_rate": 1.1591270260041587e-07, "loss": 0.4325, "step": 15452 }, { "epoch": 2.86, "learning_rate": 1.1560965403375702e-07, "loss": 0.4193, "step": 15453 }, { "epoch": 2.86, "learning_rate": 1.1530699983597349e-07, "loss": 0.4228, "step": 15454 }, { "epoch": 2.86, "learning_rate": 1.1500474001913897e-07, "loss": 0.4078, "step": 15455 }, { "epoch": 2.86, "learning_rate": 1.1470287459531381e-07, "loss": 0.4175, "step": 15456 }, { "epoch": 2.86, "learning_rate": 1.1440140357654172e-07, "loss": 0.4261, "step": 15457 }, { "epoch": 2.86, "learning_rate": 1.1410032697485085e-07, "loss": 0.4149, "step": 15458 }, { "epoch": 2.86, "learning_rate": 1.137996448022538e-07, "loss": 0.4256, "step": 15459 }, { "epoch": 2.86, "learning_rate": 1.1349935707074766e-07, "loss": 0.4323, "step": 15460 }, { "epoch": 2.86, "learning_rate": 1.1319946379231173e-07, "loss": 0.4199, "step": 15461 }, { "epoch": 2.86, "learning_rate": 1.1289996497891309e-07, "loss": 0.4192, "step": 15462 }, { "epoch": 2.86, "learning_rate": 1.1260086064250109e-07, "loss": 0.4205, "step": 15463 }, { "epoch": 2.86, "learning_rate": 1.1230215079500728e-07, "loss": 0.4183, "step": 15464 }, { "epoch": 2.86, "learning_rate": 1.1200383544835103e-07, "loss": 0.4265, "step": 15465 }, { "epoch": 2.86, "learning_rate": 1.1170591461443503e-07, "loss": 0.418, "step": 15466 }, { "epoch": 2.86, "learning_rate": 1.1140838830514644e-07, "loss": 0.4009, "step": 15467 }, { "epoch": 2.86, "learning_rate": 1.1111125653235355e-07, "loss": 0.3896, "step": 15468 }, { "epoch": 2.86, "learning_rate": 1.1081451930791354e-07, "loss": 0.4209, "step": 15469 }, { "epoch": 2.86, "learning_rate": 1.105181766436647e-07, "loss": 0.421, "step": 15470 }, { "epoch": 2.86, "learning_rate": 1.1022222855142983e-07, "loss": 0.4154, "step": 15471 }, { "epoch": 2.86, "learning_rate": 1.0992667504301834e-07, "loss": 0.39, "step": 15472 }, { "epoch": 2.86, "learning_rate": 1.0963151613022082e-07, "loss": 0.4176, "step": 15473 }, { "epoch": 2.86, "learning_rate": 1.0933675182481562e-07, "loss": 0.3995, "step": 15474 }, { "epoch": 2.86, "learning_rate": 1.090423821385611e-07, "loss": 0.4047, "step": 15475 }, { "epoch": 2.86, "learning_rate": 1.0874840708320345e-07, "loss": 0.4093, "step": 15476 }, { "epoch": 2.86, "learning_rate": 1.0845482667047103e-07, "loss": 0.4269, "step": 15477 }, { "epoch": 2.86, "learning_rate": 1.081616409120767e-07, "loss": 0.4052, "step": 15478 }, { "epoch": 2.86, "learning_rate": 1.0786884981971891e-07, "loss": 0.3924, "step": 15479 }, { "epoch": 2.86, "learning_rate": 1.0757645340507938e-07, "loss": 0.4339, "step": 15480 }, { "epoch": 2.86, "learning_rate": 1.0728445167982326e-07, "loss": 0.4246, "step": 15481 }, { "epoch": 2.86, "learning_rate": 1.0699284465560234e-07, "loss": 0.4205, "step": 15482 }, { "epoch": 2.86, "learning_rate": 1.0670163234405062e-07, "loss": 0.3985, "step": 15483 }, { "epoch": 2.86, "learning_rate": 1.064108147567866e-07, "loss": 0.4184, "step": 15484 }, { "epoch": 2.86, "learning_rate": 1.0612039190541434e-07, "loss": 0.4035, "step": 15485 }, { "epoch": 2.87, "learning_rate": 1.05830363801519e-07, "loss": 0.4202, "step": 15486 }, { "epoch": 2.87, "learning_rate": 1.0554073045667468e-07, "loss": 0.4212, "step": 15487 }, { "epoch": 2.87, "learning_rate": 1.0525149188243545e-07, "loss": 0.4229, "step": 15488 }, { "epoch": 2.87, "learning_rate": 1.0496264809034206e-07, "loss": 0.4207, "step": 15489 }, { "epoch": 2.87, "learning_rate": 1.0467419909191979e-07, "loss": 0.4058, "step": 15490 }, { "epoch": 2.87, "learning_rate": 1.0438614489867493e-07, "loss": 0.4068, "step": 15491 }, { "epoch": 2.87, "learning_rate": 1.0409848552210278e-07, "loss": 0.4182, "step": 15492 }, { "epoch": 2.87, "learning_rate": 1.0381122097367857e-07, "loss": 0.4217, "step": 15493 }, { "epoch": 2.87, "learning_rate": 1.0352435126486537e-07, "loss": 0.4103, "step": 15494 }, { "epoch": 2.87, "learning_rate": 1.0323787640710626e-07, "loss": 0.4032, "step": 15495 }, { "epoch": 2.87, "learning_rate": 1.0295179641183317e-07, "loss": 0.3985, "step": 15496 }, { "epoch": 2.87, "learning_rate": 1.0266611129046034e-07, "loss": 0.4236, "step": 15497 }, { "epoch": 2.87, "learning_rate": 1.0238082105438418e-07, "loss": 0.4044, "step": 15498 }, { "epoch": 2.87, "learning_rate": 1.0209592571498894e-07, "loss": 0.4438, "step": 15499 }, { "epoch": 2.87, "learning_rate": 1.0181142528363996e-07, "loss": 0.4058, "step": 15500 }, { "epoch": 2.87, "learning_rate": 1.015273197716904e-07, "loss": 0.4261, "step": 15501 }, { "epoch": 2.87, "learning_rate": 1.0124360919047339e-07, "loss": 0.3983, "step": 15502 }, { "epoch": 2.87, "learning_rate": 1.0096029355130876e-07, "loss": 0.4293, "step": 15503 }, { "epoch": 2.87, "learning_rate": 1.0067737286550194e-07, "loss": 0.4031, "step": 15504 }, { "epoch": 2.87, "learning_rate": 1.0039484714433834e-07, "loss": 0.4149, "step": 15505 }, { "epoch": 2.87, "learning_rate": 1.0011271639909337e-07, "loss": 0.4199, "step": 15506 }, { "epoch": 2.87, "learning_rate": 9.983098064102137e-08, "loss": 0.4044, "step": 15507 }, { "epoch": 2.87, "learning_rate": 9.954963988136334e-08, "loss": 0.4307, "step": 15508 }, { "epoch": 2.87, "learning_rate": 9.926869413134477e-08, "loss": 0.4167, "step": 15509 }, { "epoch": 2.87, "learning_rate": 9.898814340217334e-08, "loss": 0.4096, "step": 15510 }, { "epoch": 2.87, "learning_rate": 9.870798770504564e-08, "loss": 0.4253, "step": 15511 }, { "epoch": 2.87, "learning_rate": 9.842822705113608e-08, "loss": 0.4167, "step": 15512 }, { "epoch": 2.87, "learning_rate": 9.814886145160906e-08, "loss": 0.4191, "step": 15513 }, { "epoch": 2.87, "learning_rate": 9.786989091760902e-08, "loss": 0.4362, "step": 15514 }, { "epoch": 2.87, "learning_rate": 9.7591315460267e-08, "loss": 0.41, "step": 15515 }, { "epoch": 2.87, "learning_rate": 9.731313509069751e-08, "loss": 0.4133, "step": 15516 }, { "epoch": 2.87, "learning_rate": 9.70353498199994e-08, "loss": 0.4138, "step": 15517 }, { "epoch": 2.87, "learning_rate": 9.675795965925716e-08, "loss": 0.4009, "step": 15518 }, { "epoch": 2.87, "learning_rate": 9.648096461953638e-08, "loss": 0.3942, "step": 15519 }, { "epoch": 2.87, "learning_rate": 9.620436471188932e-08, "loss": 0.4241, "step": 15520 }, { "epoch": 2.87, "learning_rate": 9.59281599473516e-08, "loss": 0.4221, "step": 15521 }, { "epoch": 2.87, "learning_rate": 9.565235033694331e-08, "loss": 0.4295, "step": 15522 }, { "epoch": 2.87, "learning_rate": 9.537693589166896e-08, "loss": 0.4021, "step": 15523 }, { "epoch": 2.87, "learning_rate": 9.510191662251645e-08, "loss": 0.4145, "step": 15524 }, { "epoch": 2.87, "learning_rate": 9.48272925404592e-08, "loss": 0.4128, "step": 15525 }, { "epoch": 2.87, "learning_rate": 9.455306365645512e-08, "loss": 0.4395, "step": 15526 }, { "epoch": 2.87, "learning_rate": 9.427922998144324e-08, "loss": 0.425, "step": 15527 }, { "epoch": 2.87, "learning_rate": 9.400579152635036e-08, "loss": 0.4004, "step": 15528 }, { "epoch": 2.87, "learning_rate": 9.373274830208556e-08, "loss": 0.3997, "step": 15529 }, { "epoch": 2.87, "learning_rate": 9.346010031954344e-08, "loss": 0.4029, "step": 15530 }, { "epoch": 2.87, "learning_rate": 9.318784758960198e-08, "loss": 0.4224, "step": 15531 }, { "epoch": 2.87, "learning_rate": 9.291599012312358e-08, "loss": 0.408, "step": 15532 }, { "epoch": 2.87, "learning_rate": 9.264452793095513e-08, "loss": 0.4293, "step": 15533 }, { "epoch": 2.87, "learning_rate": 9.237346102392575e-08, "loss": 0.4042, "step": 15534 }, { "epoch": 2.87, "learning_rate": 9.210278941285233e-08, "loss": 0.389, "step": 15535 }, { "epoch": 2.87, "learning_rate": 9.183251310853403e-08, "loss": 0.4179, "step": 15536 }, { "epoch": 2.87, "learning_rate": 9.156263212175331e-08, "loss": 0.3991, "step": 15537 }, { "epoch": 2.87, "learning_rate": 9.129314646327936e-08, "loss": 0.4065, "step": 15538 }, { "epoch": 2.87, "learning_rate": 9.102405614386244e-08, "loss": 0.4296, "step": 15539 }, { "epoch": 2.88, "learning_rate": 9.075536117424067e-08, "loss": 0.4243, "step": 15540 }, { "epoch": 2.88, "learning_rate": 9.04870615651332e-08, "loss": 0.4201, "step": 15541 }, { "epoch": 2.88, "learning_rate": 9.021915732724374e-08, "loss": 0.4226, "step": 15542 }, { "epoch": 2.88, "learning_rate": 8.995164847126481e-08, "loss": 0.4177, "step": 15543 }, { "epoch": 2.88, "learning_rate": 8.968453500786456e-08, "loss": 0.4046, "step": 15544 }, { "epoch": 2.88, "learning_rate": 8.941781694770557e-08, "loss": 0.4061, "step": 15545 }, { "epoch": 2.88, "learning_rate": 8.915149430142489e-08, "loss": 0.3979, "step": 15546 }, { "epoch": 2.88, "learning_rate": 8.888556707965069e-08, "loss": 0.4102, "step": 15547 }, { "epoch": 2.88, "learning_rate": 8.862003529299223e-08, "loss": 0.4219, "step": 15548 }, { "epoch": 2.88, "learning_rate": 8.835489895204441e-08, "loss": 0.4261, "step": 15549 }, { "epoch": 2.88, "learning_rate": 8.80901580673843e-08, "loss": 0.4059, "step": 15550 }, { "epoch": 2.88, "learning_rate": 8.78258126495768e-08, "loss": 0.4104, "step": 15551 }, { "epoch": 2.88, "learning_rate": 8.756186270916678e-08, "loss": 0.4261, "step": 15552 }, { "epoch": 2.88, "learning_rate": 8.729830825668584e-08, "loss": 0.3981, "step": 15553 }, { "epoch": 2.88, "learning_rate": 8.703514930265e-08, "loss": 0.4132, "step": 15554 }, { "epoch": 2.88, "learning_rate": 8.677238585755754e-08, "loss": 0.4233, "step": 15555 }, { "epoch": 2.88, "learning_rate": 8.65100179318934e-08, "loss": 0.4179, "step": 15556 }, { "epoch": 2.88, "learning_rate": 8.624804553612587e-08, "loss": 0.4265, "step": 15557 }, { "epoch": 2.88, "learning_rate": 8.598646868070548e-08, "loss": 0.4285, "step": 15558 }, { "epoch": 2.88, "learning_rate": 8.572528737607055e-08, "loss": 0.4429, "step": 15559 }, { "epoch": 2.88, "learning_rate": 8.546450163264053e-08, "loss": 0.3921, "step": 15560 }, { "epoch": 2.88, "learning_rate": 8.520411146082042e-08, "loss": 0.4274, "step": 15561 }, { "epoch": 2.88, "learning_rate": 8.494411687099969e-08, "loss": 0.4233, "step": 15562 }, { "epoch": 2.88, "learning_rate": 8.468451787355114e-08, "loss": 0.4195, "step": 15563 }, { "epoch": 2.88, "learning_rate": 8.442531447883318e-08, "loss": 0.4156, "step": 15564 }, { "epoch": 2.88, "learning_rate": 8.41665066971864e-08, "loss": 0.397, "step": 15565 }, { "epoch": 2.88, "learning_rate": 8.390809453893812e-08, "loss": 0.417, "step": 15566 }, { "epoch": 2.88, "learning_rate": 8.365007801439673e-08, "loss": 0.4016, "step": 15567 }, { "epoch": 2.88, "learning_rate": 8.339245713385846e-08, "loss": 0.4213, "step": 15568 }, { "epoch": 2.88, "learning_rate": 8.313523190760065e-08, "loss": 0.44, "step": 15569 }, { "epoch": 2.88, "learning_rate": 8.287840234588618e-08, "loss": 0.4126, "step": 15570 }, { "epoch": 2.88, "learning_rate": 8.262196845896242e-08, "loss": 0.4257, "step": 15571 }, { "epoch": 2.88, "learning_rate": 8.23659302570612e-08, "loss": 0.3989, "step": 15572 }, { "epoch": 2.88, "learning_rate": 8.211028775039764e-08, "loss": 0.4187, "step": 15573 }, { "epoch": 2.88, "learning_rate": 8.18550409491703e-08, "loss": 0.4242, "step": 15574 }, { "epoch": 2.88, "learning_rate": 8.160018986356433e-08, "loss": 0.4045, "step": 15575 }, { "epoch": 2.88, "learning_rate": 8.134573450374605e-08, "loss": 0.4122, "step": 15576 }, { "epoch": 2.88, "learning_rate": 8.109167487987069e-08, "loss": 0.4171, "step": 15577 }, { "epoch": 2.88, "learning_rate": 8.083801100207233e-08, "loss": 0.411, "step": 15578 }, { "epoch": 2.88, "learning_rate": 8.058474288047292e-08, "loss": 0.4069, "step": 15579 }, { "epoch": 2.88, "learning_rate": 8.033187052517655e-08, "loss": 0.4194, "step": 15580 }, { "epoch": 2.88, "learning_rate": 8.007939394627295e-08, "loss": 0.4002, "step": 15581 }, { "epoch": 2.88, "learning_rate": 7.982731315383519e-08, "loss": 0.3984, "step": 15582 }, { "epoch": 2.88, "learning_rate": 7.957562815792075e-08, "loss": 0.4148, "step": 15583 }, { "epoch": 2.88, "learning_rate": 7.932433896857272e-08, "loss": 0.4186, "step": 15584 }, { "epoch": 2.88, "learning_rate": 7.907344559581421e-08, "loss": 0.4148, "step": 15585 }, { "epoch": 2.88, "learning_rate": 7.882294804965829e-08, "loss": 0.4102, "step": 15586 }, { "epoch": 2.88, "learning_rate": 7.85728463400981e-08, "loss": 0.3961, "step": 15587 }, { "epoch": 2.88, "learning_rate": 7.832314047711231e-08, "loss": 0.4131, "step": 15588 }, { "epoch": 2.88, "learning_rate": 7.807383047066297e-08, "loss": 0.4131, "step": 15589 }, { "epoch": 2.88, "learning_rate": 7.782491633069877e-08, "loss": 0.4048, "step": 15590 }, { "epoch": 2.88, "learning_rate": 7.757639806714956e-08, "loss": 0.3926, "step": 15591 }, { "epoch": 2.88, "learning_rate": 7.732827568993074e-08, "loss": 0.4227, "step": 15592 }, { "epoch": 2.88, "learning_rate": 7.708054920894326e-08, "loss": 0.4173, "step": 15593 }, { "epoch": 2.89, "learning_rate": 7.683321863406923e-08, "loss": 0.4252, "step": 15594 }, { "epoch": 2.89, "learning_rate": 7.658628397517853e-08, "loss": 0.4156, "step": 15595 }, { "epoch": 2.89, "learning_rate": 7.633974524212107e-08, "loss": 0.416, "step": 15596 }, { "epoch": 2.89, "learning_rate": 7.609360244473562e-08, "loss": 0.3901, "step": 15597 }, { "epoch": 2.89, "learning_rate": 7.584785559284103e-08, "loss": 0.4226, "step": 15598 }, { "epoch": 2.89, "learning_rate": 7.560250469624386e-08, "loss": 0.3938, "step": 15599 }, { "epoch": 2.89, "learning_rate": 7.535754976473186e-08, "loss": 0.425, "step": 15600 }, { "epoch": 2.89, "learning_rate": 7.511299080807832e-08, "loss": 0.42, "step": 15601 }, { "epoch": 2.89, "learning_rate": 7.48688278360421e-08, "loss": 0.3924, "step": 15602 }, { "epoch": 2.89, "learning_rate": 7.462506085836208e-08, "loss": 0.4094, "step": 15603 }, { "epoch": 2.89, "learning_rate": 7.438168988476713e-08, "loss": 0.4041, "step": 15604 }, { "epoch": 2.89, "learning_rate": 7.413871492496506e-08, "loss": 0.4119, "step": 15605 }, { "epoch": 2.89, "learning_rate": 7.389613598865142e-08, "loss": 0.4127, "step": 15606 }, { "epoch": 2.89, "learning_rate": 7.365395308550405e-08, "loss": 0.401, "step": 15607 }, { "epoch": 2.89, "learning_rate": 7.341216622518632e-08, "loss": 0.4323, "step": 15608 }, { "epoch": 2.89, "learning_rate": 7.317077541734386e-08, "loss": 0.4242, "step": 15609 }, { "epoch": 2.89, "learning_rate": 7.292978067160894e-08, "loss": 0.4024, "step": 15610 }, { "epoch": 2.89, "learning_rate": 7.268918199759612e-08, "loss": 0.4068, "step": 15611 }, { "epoch": 2.89, "learning_rate": 7.244897940490547e-08, "loss": 0.4144, "step": 15612 }, { "epoch": 2.89, "learning_rate": 7.220917290311935e-08, "loss": 0.4225, "step": 15613 }, { "epoch": 2.89, "learning_rate": 7.196976250180787e-08, "loss": 0.3902, "step": 15614 }, { "epoch": 2.89, "learning_rate": 7.173074821052007e-08, "loss": 0.411, "step": 15615 }, { "epoch": 2.89, "learning_rate": 7.149213003879386e-08, "loss": 0.4201, "step": 15616 }, { "epoch": 2.89, "learning_rate": 7.125390799615051e-08, "loss": 0.4116, "step": 15617 }, { "epoch": 2.89, "learning_rate": 7.101608209209242e-08, "loss": 0.4041, "step": 15618 }, { "epoch": 2.89, "learning_rate": 7.077865233611092e-08, "loss": 0.4341, "step": 15619 }, { "epoch": 2.89, "learning_rate": 7.054161873767618e-08, "loss": 0.4127, "step": 15620 }, { "epoch": 2.89, "learning_rate": 7.03049813062484e-08, "loss": 0.4376, "step": 15621 }, { "epoch": 2.89, "learning_rate": 7.006874005126674e-08, "loss": 0.4125, "step": 15622 }, { "epoch": 2.89, "learning_rate": 6.983289498215806e-08, "loss": 0.4133, "step": 15623 }, { "epoch": 2.89, "learning_rate": 6.959744610833152e-08, "loss": 0.3994, "step": 15624 }, { "epoch": 2.89, "learning_rate": 6.936239343918073e-08, "loss": 0.4182, "step": 15625 }, { "epoch": 2.89, "learning_rate": 6.912773698408481e-08, "loss": 0.3987, "step": 15626 }, { "epoch": 2.89, "learning_rate": 6.88934767524052e-08, "loss": 0.3956, "step": 15627 }, { "epoch": 2.89, "learning_rate": 6.865961275348998e-08, "loss": 0.3975, "step": 15628 }, { "epoch": 2.89, "learning_rate": 6.842614499666833e-08, "loss": 0.4033, "step": 15629 }, { "epoch": 2.89, "learning_rate": 6.819307349125503e-08, "loss": 0.403, "step": 15630 }, { "epoch": 2.89, "learning_rate": 6.796039824655043e-08, "loss": 0.4223, "step": 15631 }, { "epoch": 2.89, "learning_rate": 6.772811927183599e-08, "loss": 0.4216, "step": 15632 }, { "epoch": 2.89, "learning_rate": 6.749623657638205e-08, "loss": 0.4255, "step": 15633 }, { "epoch": 2.89, "learning_rate": 6.72647501694379e-08, "loss": 0.4091, "step": 15634 }, { "epoch": 2.89, "learning_rate": 6.70336600602417e-08, "loss": 0.4225, "step": 15635 }, { "epoch": 2.89, "learning_rate": 6.680296625801053e-08, "loss": 0.4066, "step": 15636 }, { "epoch": 2.89, "learning_rate": 6.657266877195034e-08, "loss": 0.4222, "step": 15637 }, { "epoch": 2.89, "learning_rate": 6.634276761124936e-08, "loss": 0.4003, "step": 15638 }, { "epoch": 2.89, "learning_rate": 6.611326278508134e-08, "loss": 0.4056, "step": 15639 }, { "epoch": 2.89, "learning_rate": 6.58841543026012e-08, "loss": 0.4073, "step": 15640 }, { "epoch": 2.89, "learning_rate": 6.56554421729505e-08, "loss": 0.4346, "step": 15641 }, { "epoch": 2.89, "learning_rate": 6.542712640525528e-08, "loss": 0.4271, "step": 15642 }, { "epoch": 2.89, "learning_rate": 6.519920700862381e-08, "loss": 0.4023, "step": 15643 }, { "epoch": 2.89, "learning_rate": 6.497168399215103e-08, "loss": 0.4057, "step": 15644 }, { "epoch": 2.89, "learning_rate": 6.474455736491303e-08, "loss": 0.3871, "step": 15645 }, { "epoch": 2.89, "learning_rate": 6.451782713597366e-08, "loss": 0.4039, "step": 15646 }, { "epoch": 2.89, "learning_rate": 6.429149331437679e-08, "loss": 0.4234, "step": 15647 }, { "epoch": 2.9, "learning_rate": 6.406555590915409e-08, "loss": 0.4316, "step": 15648 }, { "epoch": 2.9, "learning_rate": 6.384001492931946e-08, "loss": 0.4077, "step": 15649 }, { "epoch": 2.9, "learning_rate": 6.361487038387238e-08, "loss": 0.4169, "step": 15650 }, { "epoch": 2.9, "learning_rate": 6.339012228179564e-08, "loss": 0.4332, "step": 15651 }, { "epoch": 2.9, "learning_rate": 6.316577063205543e-08, "loss": 0.4127, "step": 15652 }, { "epoch": 2.9, "learning_rate": 6.294181544360345e-08, "loss": 0.4142, "step": 15653 }, { "epoch": 2.9, "learning_rate": 6.271825672537479e-08, "loss": 0.4164, "step": 15654 }, { "epoch": 2.9, "learning_rate": 6.24950944862901e-08, "loss": 0.4044, "step": 15655 }, { "epoch": 2.9, "learning_rate": 6.227232873525223e-08, "loss": 0.4039, "step": 15656 }, { "epoch": 2.9, "learning_rate": 6.204995948114856e-08, "loss": 0.4306, "step": 15657 }, { "epoch": 2.9, "learning_rate": 6.182798673285196e-08, "loss": 0.3909, "step": 15658 }, { "epoch": 2.9, "learning_rate": 6.160641049921867e-08, "loss": 0.394, "step": 15659 }, { "epoch": 2.9, "learning_rate": 6.138523078908943e-08, "loss": 0.4324, "step": 15660 }, { "epoch": 2.9, "learning_rate": 6.116444761128937e-08, "loss": 0.4197, "step": 15661 }, { "epoch": 2.9, "learning_rate": 6.094406097462591e-08, "loss": 0.409, "step": 15662 }, { "epoch": 2.9, "learning_rate": 6.0724070887892e-08, "loss": 0.4086, "step": 15663 }, { "epoch": 2.9, "learning_rate": 6.05044773598662e-08, "loss": 0.4102, "step": 15664 }, { "epoch": 2.9, "learning_rate": 6.028528039930925e-08, "loss": 0.4013, "step": 15665 }, { "epoch": 2.9, "learning_rate": 6.00664800149675e-08, "loss": 0.3927, "step": 15666 }, { "epoch": 2.9, "learning_rate": 5.984807621556843e-08, "loss": 0.409, "step": 15667 }, { "epoch": 2.9, "learning_rate": 5.963006900982837e-08, "loss": 0.4106, "step": 15668 }, { "epoch": 2.9, "learning_rate": 5.941245840644372e-08, "loss": 0.4189, "step": 15669 }, { "epoch": 2.9, "learning_rate": 5.919524441409863e-08, "loss": 0.4182, "step": 15670 }, { "epoch": 2.9, "learning_rate": 5.897842704145729e-08, "loss": 0.4258, "step": 15671 }, { "epoch": 2.9, "learning_rate": 5.876200629717166e-08, "loss": 0.4159, "step": 15672 }, { "epoch": 2.9, "learning_rate": 5.854598218987706e-08, "loss": 0.4178, "step": 15673 }, { "epoch": 2.9, "learning_rate": 5.833035472819104e-08, "loss": 0.4162, "step": 15674 }, { "epoch": 2.9, "learning_rate": 5.811512392071672e-08, "loss": 0.4069, "step": 15675 }, { "epoch": 2.9, "learning_rate": 5.7900289776042784e-08, "loss": 0.4198, "step": 15676 }, { "epoch": 2.9, "learning_rate": 5.7685852302740154e-08, "loss": 0.405, "step": 15677 }, { "epoch": 2.9, "learning_rate": 5.7471811509364205e-08, "loss": 0.4052, "step": 15678 }, { "epoch": 2.9, "learning_rate": 5.725816740445478e-08, "loss": 0.4267, "step": 15679 }, { "epoch": 2.9, "learning_rate": 5.7044919996536165e-08, "loss": 0.4187, "step": 15680 }, { "epoch": 2.9, "learning_rate": 5.683206929411489e-08, "loss": 0.414, "step": 15681 }, { "epoch": 2.9, "learning_rate": 5.661961530568638e-08, "loss": 0.4339, "step": 15682 }, { "epoch": 2.9, "learning_rate": 5.6407558039724974e-08, "loss": 0.403, "step": 15683 }, { "epoch": 2.9, "learning_rate": 5.619589750469279e-08, "loss": 0.4169, "step": 15684 }, { "epoch": 2.9, "learning_rate": 5.598463370903196e-08, "loss": 0.3952, "step": 15685 }, { "epoch": 2.9, "learning_rate": 5.577376666117573e-08, "loss": 0.4131, "step": 15686 }, { "epoch": 2.9, "learning_rate": 5.556329636953295e-08, "loss": 0.4073, "step": 15687 }, { "epoch": 2.9, "learning_rate": 5.535322284250355e-08, "loss": 0.4104, "step": 15688 }, { "epoch": 2.9, "learning_rate": 5.5143546088468616e-08, "loss": 0.4049, "step": 15689 }, { "epoch": 2.9, "learning_rate": 5.493426611579478e-08, "loss": 0.4168, "step": 15690 }, { "epoch": 2.9, "learning_rate": 5.4725382932829806e-08, "loss": 0.3873, "step": 15691 }, { "epoch": 2.9, "learning_rate": 5.451689654790926e-08, "loss": 0.4312, "step": 15692 }, { "epoch": 2.9, "learning_rate": 5.430880696935092e-08, "loss": 0.4126, "step": 15693 }, { "epoch": 2.9, "learning_rate": 5.410111420545705e-08, "loss": 0.4177, "step": 15694 }, { "epoch": 2.9, "learning_rate": 5.389381826451434e-08, "loss": 0.4215, "step": 15695 }, { "epoch": 2.9, "learning_rate": 5.368691915479396e-08, "loss": 0.3976, "step": 15696 }, { "epoch": 2.9, "learning_rate": 5.348041688455041e-08, "loss": 0.4186, "step": 15697 }, { "epoch": 2.9, "learning_rate": 5.3274311462022665e-08, "loss": 0.4104, "step": 15698 }, { "epoch": 2.9, "learning_rate": 5.306860289543414e-08, "loss": 0.4073, "step": 15699 }, { "epoch": 2.9, "learning_rate": 5.2863291192991605e-08, "loss": 0.4044, "step": 15700 }, { "epoch": 2.9, "learning_rate": 5.26583763628874e-08, "loss": 0.4268, "step": 15701 }, { "epoch": 2.91, "learning_rate": 5.2453858413297195e-08, "loss": 0.4163, "step": 15702 }, { "epoch": 2.91, "learning_rate": 5.224973735238004e-08, "loss": 0.3993, "step": 15703 }, { "epoch": 2.91, "learning_rate": 5.204601318828051e-08, "loss": 0.4124, "step": 15704 }, { "epoch": 2.91, "learning_rate": 5.184268592912767e-08, "loss": 0.4319, "step": 15705 }, { "epoch": 2.91, "learning_rate": 5.1639755583032804e-08, "loss": 0.4356, "step": 15706 }, { "epoch": 2.91, "learning_rate": 5.143722215809277e-08, "loss": 0.4144, "step": 15707 }, { "epoch": 2.91, "learning_rate": 5.123508566238777e-08, "loss": 0.39, "step": 15708 }, { "epoch": 2.91, "learning_rate": 5.103334610398469e-08, "loss": 0.4148, "step": 15709 }, { "epoch": 2.91, "learning_rate": 5.083200349093043e-08, "loss": 0.4169, "step": 15710 }, { "epoch": 2.91, "learning_rate": 5.0631057831257435e-08, "loss": 0.4098, "step": 15711 }, { "epoch": 2.91, "learning_rate": 5.0430509132985975e-08, "loss": 0.4042, "step": 15712 }, { "epoch": 2.91, "learning_rate": 5.0230357404115196e-08, "loss": 0.415, "step": 15713 }, { "epoch": 2.91, "learning_rate": 5.0030602652633154e-08, "loss": 0.4194, "step": 15714 }, { "epoch": 2.91, "learning_rate": 4.9831244886506816e-08, "loss": 0.3981, "step": 15715 }, { "epoch": 2.91, "learning_rate": 4.963228411369203e-08, "loss": 0.3995, "step": 15716 }, { "epoch": 2.91, "learning_rate": 4.94337203421269e-08, "loss": 0.408, "step": 15717 }, { "epoch": 2.91, "learning_rate": 4.9235553579731754e-08, "loss": 0.4101, "step": 15718 }, { "epoch": 2.91, "learning_rate": 4.903778383441582e-08, "loss": 0.4144, "step": 15719 }, { "epoch": 2.91, "learning_rate": 4.884041111406834e-08, "loss": 0.4029, "step": 15720 }, { "epoch": 2.91, "learning_rate": 4.864343542656525e-08, "loss": 0.4005, "step": 15721 }, { "epoch": 2.91, "learning_rate": 4.844685677976357e-08, "loss": 0.4202, "step": 15722 }, { "epoch": 2.91, "learning_rate": 4.825067518150817e-08, "loss": 0.3865, "step": 15723 }, { "epoch": 2.91, "learning_rate": 4.8054890639624986e-08, "loss": 0.3779, "step": 15724 }, { "epoch": 2.91, "learning_rate": 4.785950316192667e-08, "loss": 0.4159, "step": 15725 }, { "epoch": 2.91, "learning_rate": 4.766451275620809e-08, "loss": 0.4226, "step": 15726 }, { "epoch": 2.91, "learning_rate": 4.74699194302497e-08, "loss": 0.4091, "step": 15727 }, { "epoch": 2.91, "learning_rate": 4.727572319181417e-08, "loss": 0.4157, "step": 15728 }, { "epoch": 2.91, "learning_rate": 4.708192404865086e-08, "loss": 0.4168, "step": 15729 }, { "epoch": 2.91, "learning_rate": 4.688852200849026e-08, "loss": 0.4079, "step": 15730 }, { "epoch": 2.91, "learning_rate": 4.6695517079050625e-08, "loss": 0.4153, "step": 15731 }, { "epoch": 2.91, "learning_rate": 4.650290926803247e-08, "loss": 0.4011, "step": 15732 }, { "epoch": 2.91, "learning_rate": 4.631069858311965e-08, "loss": 0.3975, "step": 15733 }, { "epoch": 2.91, "learning_rate": 4.6118885031980474e-08, "loss": 0.4175, "step": 15734 }, { "epoch": 2.91, "learning_rate": 4.5927468622268826e-08, "loss": 0.4169, "step": 15735 }, { "epoch": 2.91, "learning_rate": 4.573644936162192e-08, "loss": 0.4267, "step": 15736 }, { "epoch": 2.91, "learning_rate": 4.554582725766144e-08, "loss": 0.4129, "step": 15737 }, { "epoch": 2.91, "learning_rate": 4.53556023179913e-08, "loss": 0.3885, "step": 15738 }, { "epoch": 2.91, "learning_rate": 4.51657745502021e-08, "loss": 0.4461, "step": 15739 }, { "epoch": 2.91, "learning_rate": 4.4976343961867783e-08, "loss": 0.4292, "step": 15740 }, { "epoch": 2.91, "learning_rate": 4.4787310560546746e-08, "loss": 0.4119, "step": 15741 }, { "epoch": 2.91, "learning_rate": 4.4598674353779626e-08, "loss": 0.401, "step": 15742 }, { "epoch": 2.91, "learning_rate": 4.441043534909484e-08, "loss": 0.4206, "step": 15743 }, { "epoch": 2.91, "learning_rate": 4.422259355399971e-08, "loss": 0.4144, "step": 15744 }, { "epoch": 2.91, "learning_rate": 4.4035148975991594e-08, "loss": 0.4201, "step": 15745 }, { "epoch": 2.91, "learning_rate": 4.384810162254782e-08, "loss": 0.4095, "step": 15746 }, { "epoch": 2.91, "learning_rate": 4.3661451501131325e-08, "loss": 0.4278, "step": 15747 }, { "epoch": 2.91, "learning_rate": 4.3475198619189476e-08, "loss": 0.4247, "step": 15748 }, { "epoch": 2.91, "learning_rate": 4.328934298415299e-08, "loss": 0.44, "step": 15749 }, { "epoch": 2.91, "learning_rate": 4.310388460343706e-08, "loss": 0.4191, "step": 15750 }, { "epoch": 2.91, "learning_rate": 4.291882348444132e-08, "loss": 0.4255, "step": 15751 }, { "epoch": 2.91, "learning_rate": 4.2734159634549854e-08, "loss": 0.383, "step": 15752 }, { "epoch": 2.91, "learning_rate": 4.254989306113011e-08, "loss": 0.4197, "step": 15753 }, { "epoch": 2.91, "learning_rate": 4.2366023771533983e-08, "loss": 0.3907, "step": 15754 }, { "epoch": 2.91, "learning_rate": 4.218255177309671e-08, "loss": 0.4233, "step": 15755 }, { "epoch": 2.92, "learning_rate": 4.1999477073140224e-08, "loss": 0.4245, "step": 15756 }, { "epoch": 2.92, "learning_rate": 4.181679967896757e-08, "loss": 0.4109, "step": 15757 }, { "epoch": 2.92, "learning_rate": 4.163451959786735e-08, "loss": 0.4201, "step": 15758 }, { "epoch": 2.92, "learning_rate": 4.1452636837111535e-08, "loss": 0.3986, "step": 15759 }, { "epoch": 2.92, "learning_rate": 4.1271151403958765e-08, "loss": 0.4157, "step": 15760 }, { "epoch": 2.92, "learning_rate": 4.10900633056488e-08, "loss": 0.4123, "step": 15761 }, { "epoch": 2.92, "learning_rate": 4.090937254940697e-08, "loss": 0.4196, "step": 15762 }, { "epoch": 2.92, "learning_rate": 4.0729079142443065e-08, "loss": 0.4295, "step": 15763 }, { "epoch": 2.92, "learning_rate": 4.0549183091948e-08, "loss": 0.416, "step": 15764 }, { "epoch": 2.92, "learning_rate": 4.0369684405102694e-08, "loss": 0.4159, "step": 15765 }, { "epoch": 2.92, "learning_rate": 4.019058308906698e-08, "loss": 0.4163, "step": 15766 }, { "epoch": 2.92, "learning_rate": 4.0011879150986256e-08, "loss": 0.4146, "step": 15767 }, { "epoch": 2.92, "learning_rate": 3.983357259799148e-08, "loss": 0.4184, "step": 15768 }, { "epoch": 2.92, "learning_rate": 3.965566343719585e-08, "loss": 0.4228, "step": 15769 }, { "epoch": 2.92, "learning_rate": 3.947815167569924e-08, "loss": 0.4271, "step": 15770 }, { "epoch": 2.92, "learning_rate": 3.930103732058266e-08, "loss": 0.4101, "step": 15771 }, { "epoch": 2.92, "learning_rate": 3.9124320378912674e-08, "loss": 0.3892, "step": 15772 }, { "epoch": 2.92, "learning_rate": 3.894800085774031e-08, "loss": 0.4377, "step": 15773 }, { "epoch": 2.92, "learning_rate": 3.877207876409994e-08, "loss": 0.4096, "step": 15774 }, { "epoch": 2.92, "learning_rate": 3.859655410501151e-08, "loss": 0.4239, "step": 15775 }, { "epoch": 2.92, "learning_rate": 3.842142688747719e-08, "loss": 0.423, "step": 15776 }, { "epoch": 2.92, "learning_rate": 3.824669711848472e-08, "loss": 0.4178, "step": 15777 }, { "epoch": 2.92, "learning_rate": 3.80723648050052e-08, "loss": 0.4115, "step": 15778 }, { "epoch": 2.92, "learning_rate": 3.789842995399418e-08, "loss": 0.4311, "step": 15779 }, { "epoch": 2.92, "learning_rate": 3.772489257239165e-08, "loss": 0.4272, "step": 15780 }, { "epoch": 2.92, "learning_rate": 3.7551752667120964e-08, "loss": 0.4251, "step": 15781 }, { "epoch": 2.92, "learning_rate": 3.737901024509105e-08, "loss": 0.4133, "step": 15782 }, { "epoch": 2.92, "learning_rate": 3.720666531319195e-08, "loss": 0.4096, "step": 15783 }, { "epoch": 2.92, "learning_rate": 3.70347178783026e-08, "loss": 0.4059, "step": 15784 }, { "epoch": 2.92, "learning_rate": 3.686316794728195e-08, "loss": 0.4255, "step": 15785 }, { "epoch": 2.92, "learning_rate": 3.6692015526974544e-08, "loss": 0.4141, "step": 15786 }, { "epoch": 2.92, "learning_rate": 3.652126062420824e-08, "loss": 0.4083, "step": 15787 }, { "epoch": 2.92, "learning_rate": 3.63509032457976e-08, "loss": 0.3939, "step": 15788 }, { "epoch": 2.92, "learning_rate": 3.6180943398539394e-08, "loss": 0.4168, "step": 15789 }, { "epoch": 2.92, "learning_rate": 3.601138108921265e-08, "loss": 0.412, "step": 15790 }, { "epoch": 2.92, "learning_rate": 3.584221632458418e-08, "loss": 0.4098, "step": 15791 }, { "epoch": 2.92, "learning_rate": 3.5673449111404134e-08, "loss": 0.3874, "step": 15792 }, { "epoch": 2.92, "learning_rate": 3.550507945640491e-08, "loss": 0.4379, "step": 15793 }, { "epoch": 2.92, "learning_rate": 3.533710736630336e-08, "loss": 0.4087, "step": 15794 }, { "epoch": 2.92, "learning_rate": 3.516953284780189e-08, "loss": 0.4461, "step": 15795 }, { "epoch": 2.92, "learning_rate": 3.500235590758738e-08, "loss": 0.4123, "step": 15796 }, { "epoch": 2.92, "learning_rate": 3.483557655232894e-08, "loss": 0.4353, "step": 15797 }, { "epoch": 2.92, "learning_rate": 3.4669194788682356e-08, "loss": 0.4186, "step": 15798 }, { "epoch": 2.92, "learning_rate": 3.450321062328232e-08, "loss": 0.4143, "step": 15799 }, { "epoch": 2.92, "learning_rate": 3.433762406275465e-08, "loss": 0.4084, "step": 15800 }, { "epoch": 2.92, "learning_rate": 3.417243511370516e-08, "loss": 0.4171, "step": 15801 }, { "epoch": 2.92, "learning_rate": 3.400764378272414e-08, "loss": 0.4319, "step": 15802 }, { "epoch": 2.92, "learning_rate": 3.384325007638634e-08, "loss": 0.4114, "step": 15803 }, { "epoch": 2.92, "learning_rate": 3.367925400125094e-08, "loss": 0.4157, "step": 15804 }, { "epoch": 2.92, "learning_rate": 3.351565556386161e-08, "loss": 0.4115, "step": 15805 }, { "epoch": 2.92, "learning_rate": 3.335245477074422e-08, "loss": 0.4065, "step": 15806 }, { "epoch": 2.92, "learning_rate": 3.318965162841137e-08, "loss": 0.4124, "step": 15807 }, { "epoch": 2.92, "learning_rate": 3.302724614335895e-08, "loss": 0.4284, "step": 15808 }, { "epoch": 2.92, "learning_rate": 3.2865238322066226e-08, "loss": 0.4051, "step": 15809 }, { "epoch": 2.93, "learning_rate": 3.2703628170995815e-08, "loss": 0.4154, "step": 15810 }, { "epoch": 2.93, "learning_rate": 3.2542415696596995e-08, "loss": 0.4046, "step": 15811 }, { "epoch": 2.93, "learning_rate": 3.23816009053024e-08, "loss": 0.4049, "step": 15812 }, { "epoch": 2.93, "learning_rate": 3.22211838035269e-08, "loss": 0.4297, "step": 15813 }, { "epoch": 2.93, "learning_rate": 3.206116439767093e-08, "loss": 0.4319, "step": 15814 }, { "epoch": 2.93, "learning_rate": 3.190154269411938e-08, "loss": 0.4172, "step": 15815 }, { "epoch": 2.93, "learning_rate": 3.17423186992416e-08, "loss": 0.4253, "step": 15816 }, { "epoch": 2.93, "learning_rate": 3.1583492419389183e-08, "loss": 0.4227, "step": 15817 }, { "epoch": 2.93, "learning_rate": 3.1425063860899276e-08, "loss": 0.4015, "step": 15818 }, { "epoch": 2.93, "learning_rate": 3.126703303009237e-08, "loss": 0.3911, "step": 15819 }, { "epoch": 2.93, "learning_rate": 3.110939993327566e-08, "loss": 0.4168, "step": 15820 }, { "epoch": 2.93, "learning_rate": 3.095216457673522e-08, "loss": 0.4018, "step": 15821 }, { "epoch": 2.93, "learning_rate": 3.079532696674714e-08, "loss": 0.4091, "step": 15822 }, { "epoch": 2.93, "learning_rate": 3.0638887109568636e-08, "loss": 0.4161, "step": 15823 }, { "epoch": 2.93, "learning_rate": 3.0482845011440274e-08, "loss": 0.4184, "step": 15824 }, { "epoch": 2.93, "learning_rate": 3.0327200678588185e-08, "loss": 0.4069, "step": 15825 }, { "epoch": 2.93, "learning_rate": 3.017195411722185e-08, "loss": 0.4192, "step": 15826 }, { "epoch": 2.93, "learning_rate": 3.00171053335363e-08, "loss": 0.4232, "step": 15827 }, { "epoch": 2.93, "learning_rate": 2.986265433370994e-08, "loss": 0.4034, "step": 15828 }, { "epoch": 2.93, "learning_rate": 2.9708601123904502e-08, "loss": 0.4323, "step": 15829 }, { "epoch": 2.93, "learning_rate": 2.955494571026507e-08, "loss": 0.3959, "step": 15830 }, { "epoch": 2.93, "learning_rate": 2.940168809892452e-08, "loss": 0.4122, "step": 15831 }, { "epoch": 2.93, "learning_rate": 2.9248828295996845e-08, "loss": 0.4176, "step": 15832 }, { "epoch": 2.93, "learning_rate": 2.9096366307579394e-08, "loss": 0.4319, "step": 15833 }, { "epoch": 2.93, "learning_rate": 2.8944302139757298e-08, "loss": 0.4112, "step": 15834 }, { "epoch": 2.93, "learning_rate": 2.8792635798596812e-08, "loss": 0.3958, "step": 15835 }, { "epoch": 2.93, "learning_rate": 2.864136729014755e-08, "loss": 0.4052, "step": 15836 }, { "epoch": 2.93, "learning_rate": 2.8490496620448006e-08, "loss": 0.4179, "step": 15837 }, { "epoch": 2.93, "learning_rate": 2.8340023795514483e-08, "loss": 0.4006, "step": 15838 }, { "epoch": 2.93, "learning_rate": 2.8189948821352175e-08, "loss": 0.4184, "step": 15839 }, { "epoch": 2.93, "learning_rate": 2.804027170394963e-08, "loss": 0.4158, "step": 15840 }, { "epoch": 2.93, "learning_rate": 2.789099244927651e-08, "loss": 0.413, "step": 15841 }, { "epoch": 2.93, "learning_rate": 2.774211106329028e-08, "loss": 0.4061, "step": 15842 }, { "epoch": 2.93, "learning_rate": 2.7593627551930625e-08, "loss": 0.414, "step": 15843 }, { "epoch": 2.93, "learning_rate": 2.744554192112281e-08, "loss": 0.4036, "step": 15844 }, { "epoch": 2.93, "learning_rate": 2.729785417677322e-08, "loss": 0.4017, "step": 15845 }, { "epoch": 2.93, "learning_rate": 2.715056432477492e-08, "loss": 0.4024, "step": 15846 }, { "epoch": 2.93, "learning_rate": 2.700367237100543e-08, "loss": 0.4008, "step": 15847 }, { "epoch": 2.93, "learning_rate": 2.6857178321324507e-08, "loss": 0.4253, "step": 15848 }, { "epoch": 2.93, "learning_rate": 2.6711082181578585e-08, "loss": 0.3959, "step": 15849 }, { "epoch": 2.93, "learning_rate": 2.6565383957594116e-08, "loss": 0.429, "step": 15850 }, { "epoch": 2.93, "learning_rate": 2.6420083655186444e-08, "loss": 0.4143, "step": 15851 }, { "epoch": 2.93, "learning_rate": 2.627518128015094e-08, "loss": 0.4053, "step": 15852 }, { "epoch": 2.93, "learning_rate": 2.6130676838270752e-08, "loss": 0.4182, "step": 15853 }, { "epoch": 2.93, "learning_rate": 2.5986570335309048e-08, "loss": 0.3947, "step": 15854 }, { "epoch": 2.93, "learning_rate": 2.5842861777017893e-08, "loss": 0.4055, "step": 15855 }, { "epoch": 2.93, "learning_rate": 2.5699551169129366e-08, "loss": 0.4034, "step": 15856 }, { "epoch": 2.93, "learning_rate": 2.555663851736223e-08, "loss": 0.4166, "step": 15857 }, { "epoch": 2.93, "learning_rate": 2.541412382741859e-08, "loss": 0.4396, "step": 15858 }, { "epoch": 2.93, "learning_rate": 2.5272007104982787e-08, "loss": 0.4177, "step": 15859 }, { "epoch": 2.93, "learning_rate": 2.513028835572695e-08, "loss": 0.4009, "step": 15860 }, { "epoch": 2.93, "learning_rate": 2.4988967585304335e-08, "loss": 0.4157, "step": 15861 }, { "epoch": 2.93, "learning_rate": 2.4848044799353766e-08, "loss": 0.3978, "step": 15862 }, { "epoch": 2.93, "learning_rate": 2.470752000349741e-08, "loss": 0.4259, "step": 15863 }, { "epoch": 2.94, "learning_rate": 2.4567393203343005e-08, "loss": 0.425, "step": 15864 }, { "epoch": 2.94, "learning_rate": 2.4427664404479412e-08, "loss": 0.4046, "step": 15865 }, { "epoch": 2.94, "learning_rate": 2.4288333612483283e-08, "loss": 0.4052, "step": 15866 }, { "epoch": 2.94, "learning_rate": 2.4149400832913505e-08, "loss": 0.4305, "step": 15867 }, { "epoch": 2.94, "learning_rate": 2.4010866071312312e-08, "loss": 0.4264, "step": 15868 }, { "epoch": 2.94, "learning_rate": 2.38727293332075e-08, "loss": 0.4284, "step": 15869 }, { "epoch": 2.94, "learning_rate": 2.3734990624111333e-08, "loss": 0.4144, "step": 15870 }, { "epoch": 2.94, "learning_rate": 2.3597649949518297e-08, "loss": 0.4211, "step": 15871 }, { "epoch": 2.94, "learning_rate": 2.3460707314907348e-08, "loss": 0.3992, "step": 15872 }, { "epoch": 2.94, "learning_rate": 2.3324162725743004e-08, "loss": 0.4143, "step": 15873 }, { "epoch": 2.94, "learning_rate": 2.318801618747424e-08, "loss": 0.4206, "step": 15874 }, { "epoch": 2.94, "learning_rate": 2.305226770553115e-08, "loss": 0.402, "step": 15875 }, { "epoch": 2.94, "learning_rate": 2.291691728533163e-08, "loss": 0.4218, "step": 15876 }, { "epoch": 2.94, "learning_rate": 2.278196493227469e-08, "loss": 0.4242, "step": 15877 }, { "epoch": 2.94, "learning_rate": 2.2647410651744918e-08, "loss": 0.4308, "step": 15878 }, { "epoch": 2.94, "learning_rate": 2.2513254449110232e-08, "loss": 0.4203, "step": 15879 }, { "epoch": 2.94, "learning_rate": 2.2379496329725247e-08, "loss": 0.4107, "step": 15880 }, { "epoch": 2.94, "learning_rate": 2.224613629892458e-08, "loss": 0.4097, "step": 15881 }, { "epoch": 2.94, "learning_rate": 2.211317436202953e-08, "loss": 0.4056, "step": 15882 }, { "epoch": 2.94, "learning_rate": 2.1980610524345858e-08, "loss": 0.3977, "step": 15883 }, { "epoch": 2.94, "learning_rate": 2.184844479116155e-08, "loss": 0.4132, "step": 15884 }, { "epoch": 2.94, "learning_rate": 2.1716677167750165e-08, "loss": 0.41, "step": 15885 }, { "epoch": 2.94, "learning_rate": 2.1585307659368615e-08, "loss": 0.4204, "step": 15886 }, { "epoch": 2.94, "learning_rate": 2.145433627125937e-08, "loss": 0.405, "step": 15887 }, { "epoch": 2.94, "learning_rate": 2.1323763008647134e-08, "loss": 0.4125, "step": 15888 }, { "epoch": 2.94, "learning_rate": 2.1193587876742193e-08, "loss": 0.4113, "step": 15889 }, { "epoch": 2.94, "learning_rate": 2.1063810880737058e-08, "loss": 0.4052, "step": 15890 }, { "epoch": 2.94, "learning_rate": 2.0934432025810913e-08, "loss": 0.4172, "step": 15891 }, { "epoch": 2.94, "learning_rate": 2.0805451317125193e-08, "loss": 0.3976, "step": 15892 }, { "epoch": 2.94, "learning_rate": 2.0676868759825775e-08, "loss": 0.4043, "step": 15893 }, { "epoch": 2.94, "learning_rate": 2.0548684359043002e-08, "loss": 0.4167, "step": 15894 }, { "epoch": 2.94, "learning_rate": 2.0420898119891676e-08, "loss": 0.4387, "step": 15895 }, { "epoch": 2.94, "learning_rate": 2.0293510047469932e-08, "loss": 0.4287, "step": 15896 }, { "epoch": 2.94, "learning_rate": 2.016652014685927e-08, "loss": 0.3953, "step": 15897 }, { "epoch": 2.94, "learning_rate": 2.0039928423128962e-08, "loss": 0.4192, "step": 15898 }, { "epoch": 2.94, "learning_rate": 1.9913734881326085e-08, "loss": 0.4143, "step": 15899 }, { "epoch": 2.94, "learning_rate": 1.9787939526488832e-08, "loss": 0.4144, "step": 15900 }, { "epoch": 2.94, "learning_rate": 1.9662542363634297e-08, "loss": 0.4028, "step": 15901 }, { "epoch": 2.94, "learning_rate": 1.9537543397766258e-08, "loss": 0.4091, "step": 15902 }, { "epoch": 2.94, "learning_rate": 1.9412942633872945e-08, "loss": 0.4141, "step": 15903 }, { "epoch": 2.94, "learning_rate": 1.928874007692372e-08, "loss": 0.4146, "step": 15904 }, { "epoch": 2.94, "learning_rate": 1.9164935731874612e-08, "loss": 0.425, "step": 15905 }, { "epoch": 2.94, "learning_rate": 1.904152960366612e-08, "loss": 0.3987, "step": 15906 }, { "epoch": 2.94, "learning_rate": 1.891852169722097e-08, "loss": 0.3994, "step": 15907 }, { "epoch": 2.94, "learning_rate": 1.879591201744857e-08, "loss": 0.4371, "step": 15908 }, { "epoch": 2.94, "learning_rate": 1.867370056923834e-08, "loss": 0.3794, "step": 15909 }, { "epoch": 2.94, "learning_rate": 1.855188735746749e-08, "loss": 0.4167, "step": 15910 }, { "epoch": 2.94, "learning_rate": 1.8430472386996577e-08, "loss": 0.4112, "step": 15911 }, { "epoch": 2.94, "learning_rate": 1.8309455662669508e-08, "loss": 0.4105, "step": 15912 }, { "epoch": 2.94, "learning_rate": 1.8188837189314636e-08, "loss": 0.4126, "step": 15913 }, { "epoch": 2.94, "learning_rate": 1.8068616971743667e-08, "loss": 0.4134, "step": 15914 }, { "epoch": 2.94, "learning_rate": 1.7948795014753883e-08, "loss": 0.4113, "step": 15915 }, { "epoch": 2.94, "learning_rate": 1.78293713231259e-08, "loss": 0.3958, "step": 15916 }, { "epoch": 2.94, "learning_rate": 1.7710345901625903e-08, "loss": 0.4054, "step": 15917 }, { "epoch": 2.95, "learning_rate": 1.7591718755000097e-08, "loss": 0.4118, "step": 15918 }, { "epoch": 2.95, "learning_rate": 1.7473489887982475e-08, "loss": 0.4046, "step": 15919 }, { "epoch": 2.95, "learning_rate": 1.7355659305291483e-08, "loss": 0.401, "step": 15920 }, { "epoch": 2.95, "learning_rate": 1.7238227011626697e-08, "loss": 0.4119, "step": 15921 }, { "epoch": 2.95, "learning_rate": 1.7121193011674364e-08, "loss": 0.4052, "step": 15922 }, { "epoch": 2.95, "learning_rate": 1.7004557310102977e-08, "loss": 0.4392, "step": 15923 }, { "epoch": 2.95, "learning_rate": 1.6888319911567697e-08, "loss": 0.3862, "step": 15924 }, { "epoch": 2.95, "learning_rate": 1.6772480820704818e-08, "loss": 0.416, "step": 15925 }, { "epoch": 2.95, "learning_rate": 1.6657040042136198e-08, "loss": 0.4335, "step": 15926 }, { "epoch": 2.95, "learning_rate": 1.654199758046815e-08, "loss": 0.4214, "step": 15927 }, { "epoch": 2.95, "learning_rate": 1.642735344029034e-08, "loss": 0.4125, "step": 15928 }, { "epoch": 2.95, "learning_rate": 1.631310762617688e-08, "loss": 0.3916, "step": 15929 }, { "epoch": 2.95, "learning_rate": 1.6199260142687466e-08, "loss": 0.3987, "step": 15930 }, { "epoch": 2.95, "learning_rate": 1.6085810994361793e-08, "loss": 0.3978, "step": 15931 }, { "epoch": 2.95, "learning_rate": 1.5972760185727352e-08, "loss": 0.3887, "step": 15932 }, { "epoch": 2.95, "learning_rate": 1.5860107721296093e-08, "loss": 0.4342, "step": 15933 }, { "epoch": 2.95, "learning_rate": 1.574785360555997e-08, "loss": 0.4033, "step": 15934 }, { "epoch": 2.95, "learning_rate": 1.563599784299985e-08, "loss": 0.4166, "step": 15935 }, { "epoch": 2.95, "learning_rate": 1.552454043807772e-08, "loss": 0.4183, "step": 15936 }, { "epoch": 2.95, "learning_rate": 1.5413481395241126e-08, "loss": 0.4093, "step": 15937 }, { "epoch": 2.95, "learning_rate": 1.5302820718919863e-08, "loss": 0.4104, "step": 15938 }, { "epoch": 2.95, "learning_rate": 1.51925584135304e-08, "loss": 0.4135, "step": 15939 }, { "epoch": 2.95, "learning_rate": 1.508269448347144e-08, "loss": 0.4301, "step": 15940 }, { "epoch": 2.95, "learning_rate": 1.4973228933126138e-08, "loss": 0.3942, "step": 15941 }, { "epoch": 2.95, "learning_rate": 1.4864161766862118e-08, "loss": 0.4103, "step": 15942 }, { "epoch": 2.95, "learning_rate": 1.475549298903145e-08, "loss": 0.4209, "step": 15943 }, { "epoch": 2.95, "learning_rate": 1.4647222603969557e-08, "loss": 0.4266, "step": 15944 }, { "epoch": 2.95, "learning_rate": 1.4539350615996318e-08, "loss": 0.4349, "step": 15945 }, { "epoch": 2.95, "learning_rate": 1.4431877029414953e-08, "loss": 0.3898, "step": 15946 }, { "epoch": 2.95, "learning_rate": 1.4324801848513148e-08, "loss": 0.4309, "step": 15947 }, { "epoch": 2.95, "learning_rate": 1.421812507756526e-08, "loss": 0.397, "step": 15948 }, { "epoch": 2.95, "learning_rate": 1.4111846720824552e-08, "loss": 0.4152, "step": 15949 }, { "epoch": 2.95, "learning_rate": 1.4005966782533187e-08, "loss": 0.4002, "step": 15950 }, { "epoch": 2.95, "learning_rate": 1.3900485266915564e-08, "loss": 0.4127, "step": 15951 }, { "epoch": 2.95, "learning_rate": 1.3795402178180538e-08, "loss": 0.4418, "step": 15952 }, { "epoch": 2.95, "learning_rate": 1.3690717520519204e-08, "loss": 0.4129, "step": 15953 }, { "epoch": 2.95, "learning_rate": 1.3586431298108217e-08, "loss": 0.4317, "step": 15954 }, { "epoch": 2.95, "learning_rate": 1.3482543515110913e-08, "loss": 0.4138, "step": 15955 }, { "epoch": 2.95, "learning_rate": 1.3379054175669537e-08, "loss": 0.4187, "step": 15956 }, { "epoch": 2.95, "learning_rate": 1.3275963283914117e-08, "loss": 0.4177, "step": 15957 }, { "epoch": 2.95, "learning_rate": 1.317327084395803e-08, "loss": 0.3972, "step": 15958 }, { "epoch": 2.95, "learning_rate": 1.3070976859899109e-08, "loss": 0.426, "step": 15959 }, { "epoch": 2.95, "learning_rate": 1.2969081335816313e-08, "loss": 0.4411, "step": 15960 }, { "epoch": 2.95, "learning_rate": 1.2867584275777501e-08, "loss": 0.4016, "step": 15961 }, { "epoch": 2.95, "learning_rate": 1.2766485683831652e-08, "loss": 0.4125, "step": 15962 }, { "epoch": 2.95, "learning_rate": 1.2665785564012212e-08, "loss": 0.4151, "step": 15963 }, { "epoch": 2.95, "learning_rate": 1.2565483920337073e-08, "loss": 0.4277, "step": 15964 }, { "epoch": 2.95, "learning_rate": 1.2465580756806373e-08, "loss": 0.4248, "step": 15965 }, { "epoch": 2.95, "learning_rate": 1.2366076077409139e-08, "loss": 0.4272, "step": 15966 }, { "epoch": 2.95, "learning_rate": 1.2266969886113312e-08, "loss": 0.4137, "step": 15967 }, { "epoch": 2.95, "learning_rate": 1.2168262186873503e-08, "loss": 0.3956, "step": 15968 }, { "epoch": 2.95, "learning_rate": 1.2069952983628785e-08, "loss": 0.4127, "step": 15969 }, { "epoch": 2.95, "learning_rate": 1.1972042280299357e-08, "loss": 0.4188, "step": 15970 }, { "epoch": 2.95, "learning_rate": 1.1874530080794312e-08, "loss": 0.3849, "step": 15971 }, { "epoch": 2.96, "learning_rate": 1.177741638900276e-08, "loss": 0.4062, "step": 15972 }, { "epoch": 2.96, "learning_rate": 1.1680701208799383e-08, "loss": 0.4222, "step": 15973 }, { "epoch": 2.96, "learning_rate": 1.1584384544043314e-08, "loss": 0.4052, "step": 15974 }, { "epoch": 2.96, "learning_rate": 1.1488466398577036e-08, "loss": 0.3975, "step": 15975 }, { "epoch": 2.96, "learning_rate": 1.1392946776227487e-08, "loss": 0.3961, "step": 15976 }, { "epoch": 2.96, "learning_rate": 1.1297825680806063e-08, "loss": 0.42, "step": 15977 }, { "epoch": 2.96, "learning_rate": 1.1203103116108615e-08, "loss": 0.4095, "step": 15978 }, { "epoch": 2.96, "learning_rate": 1.1108779085913234e-08, "loss": 0.4368, "step": 15979 }, { "epoch": 2.96, "learning_rate": 1.1014853593982466e-08, "loss": 0.4026, "step": 15980 }, { "epoch": 2.96, "learning_rate": 1.0921326644066643e-08, "loss": 0.419, "step": 15981 }, { "epoch": 2.96, "learning_rate": 1.0828198239893895e-08, "loss": 0.4164, "step": 15982 }, { "epoch": 2.96, "learning_rate": 1.0735468385183467e-08, "loss": 0.4028, "step": 15983 }, { "epoch": 2.96, "learning_rate": 1.0643137083631294e-08, "loss": 0.4084, "step": 15984 }, { "epoch": 2.96, "learning_rate": 1.0551204338924425e-08, "loss": 0.3913, "step": 15985 }, { "epoch": 2.96, "learning_rate": 1.0459670154728818e-08, "loss": 0.4238, "step": 15986 }, { "epoch": 2.96, "learning_rate": 1.0368534534698216e-08, "loss": 0.4184, "step": 15987 }, { "epoch": 2.96, "learning_rate": 1.0277797482466378e-08, "loss": 0.4166, "step": 15988 }, { "epoch": 2.96, "learning_rate": 1.0187459001655964e-08, "loss": 0.4211, "step": 15989 }, { "epoch": 2.96, "learning_rate": 1.0097519095869645e-08, "loss": 0.4256, "step": 15990 }, { "epoch": 2.96, "learning_rate": 1.0007977768697885e-08, "loss": 0.4123, "step": 15991 }, { "epoch": 2.96, "learning_rate": 9.91883502371005e-09, "loss": 0.4157, "step": 15992 }, { "epoch": 2.96, "learning_rate": 9.830090864465514e-09, "loss": 0.4121, "step": 15993 }, { "epoch": 2.96, "learning_rate": 9.741745294503668e-09, "loss": 0.4203, "step": 15994 }, { "epoch": 2.96, "learning_rate": 9.653798317350582e-09, "loss": 0.3928, "step": 15995 }, { "epoch": 2.96, "learning_rate": 9.56624993651345e-09, "loss": 0.3972, "step": 15996 }, { "epoch": 2.96, "learning_rate": 9.479100155486143e-09, "loss": 0.4126, "step": 15997 }, { "epoch": 2.96, "learning_rate": 9.39234897774588e-09, "loss": 0.4026, "step": 15998 }, { "epoch": 2.96, "learning_rate": 9.305996406754336e-09, "loss": 0.4081, "step": 15999 }, { "epoch": 2.96, "learning_rate": 9.220042445955425e-09, "loss": 0.4306, "step": 16000 }, { "epoch": 2.96, "learning_rate": 9.134487098779732e-09, "loss": 0.3829, "step": 16001 }, { "epoch": 2.96, "learning_rate": 9.049330368641196e-09, "loss": 0.403, "step": 16002 }, { "epoch": 2.96, "learning_rate": 8.964572258935989e-09, "loss": 0.4263, "step": 16003 }, { "epoch": 2.96, "learning_rate": 8.880212773045849e-09, "loss": 0.3789, "step": 16004 }, { "epoch": 2.96, "learning_rate": 8.796251914338083e-09, "loss": 0.4278, "step": 16005 }, { "epoch": 2.96, "learning_rate": 8.712689686161125e-09, "loss": 0.4115, "step": 16006 }, { "epoch": 2.96, "learning_rate": 8.629526091848972e-09, "loss": 0.4298, "step": 16007 }, { "epoch": 2.96, "learning_rate": 8.546761134721193e-09, "loss": 0.4242, "step": 16008 }, { "epoch": 2.96, "learning_rate": 8.464394818078481e-09, "loss": 0.4126, "step": 16009 }, { "epoch": 2.96, "learning_rate": 8.382427145207095e-09, "loss": 0.4243, "step": 16010 }, { "epoch": 2.96, "learning_rate": 8.300858119378864e-09, "loss": 0.4061, "step": 16011 }, { "epoch": 2.96, "learning_rate": 8.219687743846738e-09, "loss": 0.4239, "step": 16012 }, { "epoch": 2.96, "learning_rate": 8.138916021850352e-09, "loss": 0.4054, "step": 16013 }, { "epoch": 2.96, "learning_rate": 8.05854295661046e-09, "loss": 0.4264, "step": 16014 }, { "epoch": 2.96, "learning_rate": 7.978568551336718e-09, "loss": 0.4375, "step": 16015 }, { "epoch": 2.96, "learning_rate": 7.898992809217687e-09, "loss": 0.3819, "step": 16016 }, { "epoch": 2.96, "learning_rate": 7.819815733428604e-09, "loss": 0.4146, "step": 16017 }, { "epoch": 2.96, "learning_rate": 7.741037327129163e-09, "loss": 0.411, "step": 16018 }, { "epoch": 2.96, "learning_rate": 7.662657593461298e-09, "loss": 0.4113, "step": 16019 }, { "epoch": 2.96, "learning_rate": 7.584676535554725e-09, "loss": 0.4062, "step": 16020 }, { "epoch": 2.96, "learning_rate": 7.507094156518069e-09, "loss": 0.4226, "step": 16021 }, { "epoch": 2.96, "learning_rate": 7.429910459447742e-09, "loss": 0.4079, "step": 16022 }, { "epoch": 2.96, "learning_rate": 7.353125447423504e-09, "loss": 0.41, "step": 16023 }, { "epoch": 2.96, "learning_rate": 7.276739123508458e-09, "loss": 0.3884, "step": 16024 }, { "epoch": 2.96, "learning_rate": 7.200751490751279e-09, "loss": 0.4065, "step": 16025 }, { "epoch": 2.97, "learning_rate": 7.125162552181764e-09, "loss": 0.4175, "step": 16026 }, { "epoch": 2.97, "learning_rate": 7.049972310817499e-09, "loss": 0.397, "step": 16027 }, { "epoch": 2.97, "learning_rate": 6.975180769657197e-09, "loss": 0.4244, "step": 16028 }, { "epoch": 2.97, "learning_rate": 6.900787931686248e-09, "loss": 0.4209, "step": 16029 }, { "epoch": 2.97, "learning_rate": 6.826793799872278e-09, "loss": 0.4419, "step": 16030 }, { "epoch": 2.97, "learning_rate": 6.75319837716737e-09, "loss": 0.4052, "step": 16031 }, { "epoch": 2.97, "learning_rate": 6.680001666508062e-09, "loss": 0.4145, "step": 16032 }, { "epoch": 2.97, "learning_rate": 6.607203670814244e-09, "loss": 0.41, "step": 16033 }, { "epoch": 2.97, "learning_rate": 6.534804392990257e-09, "loss": 0.451, "step": 16034 }, { "epoch": 2.97, "learning_rate": 6.4628038359260124e-09, "loss": 0.4243, "step": 16035 }, { "epoch": 2.97, "learning_rate": 6.391202002492547e-09, "loss": 0.4018, "step": 16036 }, { "epoch": 2.97, "learning_rate": 6.319998895547575e-09, "loss": 0.4285, "step": 16037 }, { "epoch": 2.97, "learning_rate": 6.249194517932156e-09, "loss": 0.4191, "step": 16038 }, { "epoch": 2.97, "learning_rate": 6.178788872470698e-09, "loss": 0.4147, "step": 16039 }, { "epoch": 2.97, "learning_rate": 6.108781961973176e-09, "loss": 0.4199, "step": 16040 }, { "epoch": 2.97, "learning_rate": 6.03917378923069e-09, "loss": 0.3913, "step": 16041 }, { "epoch": 2.97, "learning_rate": 5.969964357023239e-09, "loss": 0.4105, "step": 16042 }, { "epoch": 2.97, "learning_rate": 5.901153668109727e-09, "loss": 0.4035, "step": 16043 }, { "epoch": 2.97, "learning_rate": 5.832741725237956e-09, "loss": 0.4104, "step": 16044 }, { "epoch": 2.97, "learning_rate": 5.764728531134633e-09, "loss": 0.4326, "step": 16045 }, { "epoch": 2.97, "learning_rate": 5.697114088515365e-09, "loss": 0.4155, "step": 16046 }, { "epoch": 2.97, "learning_rate": 5.629898400077993e-09, "loss": 0.4362, "step": 16047 }, { "epoch": 2.97, "learning_rate": 5.563081468502595e-09, "loss": 0.4225, "step": 16048 }, { "epoch": 2.97, "learning_rate": 5.496663296455929e-09, "loss": 0.4099, "step": 16049 }, { "epoch": 2.97, "learning_rate": 5.430643886588094e-09, "loss": 0.4174, "step": 16050 }, { "epoch": 2.97, "learning_rate": 5.365023241533651e-09, "loss": 0.4027, "step": 16051 }, { "epoch": 2.97, "learning_rate": 5.299801363910506e-09, "loss": 0.4394, "step": 16052 }, { "epoch": 2.97, "learning_rate": 5.234978256319911e-09, "loss": 0.429, "step": 16053 }, { "epoch": 2.97, "learning_rate": 5.170553921349797e-09, "loss": 0.4197, "step": 16054 }, { "epoch": 2.97, "learning_rate": 5.1065283615681085e-09, "loss": 0.4114, "step": 16055 }, { "epoch": 2.97, "learning_rate": 5.04290157953169e-09, "loss": 0.3846, "step": 16056 }, { "epoch": 2.97, "learning_rate": 4.97967357777851e-09, "loss": 0.4144, "step": 16057 }, { "epoch": 2.97, "learning_rate": 4.916844358830996e-09, "loss": 0.4215, "step": 16058 }, { "epoch": 2.97, "learning_rate": 4.8544139251960335e-09, "loss": 0.4, "step": 16059 }, { "epoch": 2.97, "learning_rate": 4.79238227936385e-09, "loss": 0.4148, "step": 16060 }, { "epoch": 2.97, "learning_rate": 4.730749423811354e-09, "loss": 0.4036, "step": 16061 }, { "epoch": 2.97, "learning_rate": 4.6695153609954695e-09, "loss": 0.4224, "step": 16062 }, { "epoch": 2.97, "learning_rate": 4.608680093359797e-09, "loss": 0.4217, "step": 16063 }, { "epoch": 2.97, "learning_rate": 4.548243623331283e-09, "loss": 0.4134, "step": 16064 }, { "epoch": 2.97, "learning_rate": 4.488205953322444e-09, "loss": 0.413, "step": 16065 }, { "epoch": 2.97, "learning_rate": 4.4285670857280305e-09, "loss": 0.4255, "step": 16066 }, { "epoch": 2.97, "learning_rate": 4.36932702292725e-09, "loss": 0.4061, "step": 16067 }, { "epoch": 2.97, "learning_rate": 4.310485767283767e-09, "loss": 0.4151, "step": 16068 }, { "epoch": 2.97, "learning_rate": 4.252043321145705e-09, "loss": 0.42, "step": 16069 }, { "epoch": 2.97, "learning_rate": 4.1939996868445296e-09, "loss": 0.3921, "step": 16070 }, { "epoch": 2.97, "learning_rate": 4.136354866696169e-09, "loss": 0.4372, "step": 16071 }, { "epoch": 2.97, "learning_rate": 4.079108862999892e-09, "loss": 0.4265, "step": 16072 }, { "epoch": 2.97, "learning_rate": 4.0222616780405396e-09, "loss": 0.4123, "step": 16073 }, { "epoch": 2.97, "learning_rate": 3.9658133140862975e-09, "loss": 0.4124, "step": 16074 }, { "epoch": 2.97, "learning_rate": 3.909763773388697e-09, "loss": 0.4209, "step": 16075 }, { "epoch": 2.97, "learning_rate": 3.8541130581837285e-09, "loss": 0.4074, "step": 16076 }, { "epoch": 2.97, "learning_rate": 3.798861170691836e-09, "loss": 0.4283, "step": 16077 }, { "epoch": 2.97, "learning_rate": 3.744008113119035e-09, "loss": 0.4014, "step": 16078 }, { "epoch": 2.97, "learning_rate": 3.689553887652464e-09, "loss": 0.4002, "step": 16079 }, { "epoch": 2.98, "learning_rate": 3.6354984964648286e-09, "loss": 0.4148, "step": 16080 }, { "epoch": 2.98, "learning_rate": 3.5818419417132934e-09, "loss": 0.3963, "step": 16081 }, { "epoch": 2.98, "learning_rate": 3.528584225538367e-09, "loss": 0.3929, "step": 16082 }, { "epoch": 2.98, "learning_rate": 3.4757253500650178e-09, "loss": 0.412, "step": 16083 }, { "epoch": 2.98, "learning_rate": 3.4232653174015583e-09, "loss": 0.4287, "step": 16084 }, { "epoch": 2.98, "learning_rate": 3.3712041296418698e-09, "loss": 0.4178, "step": 16085 }, { "epoch": 2.98, "learning_rate": 3.3195417888631786e-09, "loss": 0.4114, "step": 16086 }, { "epoch": 2.98, "learning_rate": 3.2682782971260595e-09, "loss": 0.406, "step": 16087 }, { "epoch": 2.98, "learning_rate": 3.2174136564766533e-09, "loss": 0.444, "step": 16088 }, { "epoch": 2.98, "learning_rate": 3.1669478689433375e-09, "loss": 0.4062, "step": 16089 }, { "epoch": 2.98, "learning_rate": 3.1168809365400567e-09, "loss": 0.4228, "step": 16090 }, { "epoch": 2.98, "learning_rate": 3.0672128612652117e-09, "loss": 0.4193, "step": 16091 }, { "epoch": 2.98, "learning_rate": 3.0179436450994416e-09, "loss": 0.4202, "step": 16092 }, { "epoch": 2.98, "learning_rate": 2.9690732900089504e-09, "loss": 0.4088, "step": 16093 }, { "epoch": 2.98, "learning_rate": 2.92060179794329e-09, "loss": 0.4192, "step": 16094 }, { "epoch": 2.98, "learning_rate": 2.872529170836469e-09, "loss": 0.4072, "step": 16095 }, { "epoch": 2.98, "learning_rate": 2.8248554106058425e-09, "loss": 0.4005, "step": 16096 }, { "epoch": 2.98, "learning_rate": 2.777580519155443e-09, "loss": 0.3889, "step": 16097 }, { "epoch": 2.98, "learning_rate": 2.7307044983693188e-09, "loss": 0.3971, "step": 16098 }, { "epoch": 2.98, "learning_rate": 2.6842273501193063e-09, "loss": 0.4192, "step": 16099 }, { "epoch": 2.98, "learning_rate": 2.6381490762583673e-09, "loss": 0.4165, "step": 16100 }, { "epoch": 2.98, "learning_rate": 2.5924696786261416e-09, "loss": 0.4139, "step": 16101 }, { "epoch": 2.98, "learning_rate": 2.5471891590445052e-09, "loss": 0.4006, "step": 16102 }, { "epoch": 2.98, "learning_rate": 2.502307519320901e-09, "loss": 0.4144, "step": 16103 }, { "epoch": 2.98, "learning_rate": 2.4578247612438987e-09, "loss": 0.4049, "step": 16104 }, { "epoch": 2.98, "learning_rate": 2.413740886590965e-09, "loss": 0.4197, "step": 16105 }, { "epoch": 2.98, "learning_rate": 2.370055897119583e-09, "loss": 0.3971, "step": 16106 }, { "epoch": 2.98, "learning_rate": 2.326769794572803e-09, "loss": 0.4203, "step": 16107 }, { "epoch": 2.98, "learning_rate": 2.2838825806770214e-09, "loss": 0.4057, "step": 16108 }, { "epoch": 2.98, "learning_rate": 2.2413942571442026e-09, "loss": 0.4247, "step": 16109 }, { "epoch": 2.98, "learning_rate": 2.1993048256707673e-09, "loss": 0.4129, "step": 16110 }, { "epoch": 2.98, "learning_rate": 2.1576142879331518e-09, "loss": 0.4107, "step": 16111 }, { "epoch": 2.98, "learning_rate": 2.1163226455966914e-09, "loss": 0.3956, "step": 16112 }, { "epoch": 2.98, "learning_rate": 2.075429900307846e-09, "loss": 0.3904, "step": 16113 }, { "epoch": 2.98, "learning_rate": 2.0349360536997543e-09, "loss": 0.4134, "step": 16114 }, { "epoch": 2.98, "learning_rate": 1.9948411073866803e-09, "loss": 0.4042, "step": 16115 }, { "epoch": 2.98, "learning_rate": 1.9551450629684552e-09, "loss": 0.4128, "step": 16116 }, { "epoch": 2.98, "learning_rate": 1.9158479220282576e-09, "loss": 0.417, "step": 16117 }, { "epoch": 2.98, "learning_rate": 1.8769496861359427e-09, "loss": 0.3961, "step": 16118 }, { "epoch": 2.98, "learning_rate": 1.8384503568413814e-09, "loss": 0.4162, "step": 16119 }, { "epoch": 2.98, "learning_rate": 1.8003499356822328e-09, "loss": 0.4124, "step": 16120 }, { "epoch": 2.98, "learning_rate": 1.7626484241772823e-09, "loss": 0.4255, "step": 16121 }, { "epoch": 2.98, "learning_rate": 1.725345823831992e-09, "loss": 0.4276, "step": 16122 }, { "epoch": 2.98, "learning_rate": 1.6884421361340608e-09, "loss": 0.4275, "step": 16123 }, { "epoch": 2.98, "learning_rate": 1.6519373625556446e-09, "loss": 0.4259, "step": 16124 }, { "epoch": 2.98, "learning_rate": 1.6158315045544658e-09, "loss": 0.4145, "step": 16125 }, { "epoch": 2.98, "learning_rate": 1.5801245635682638e-09, "loss": 0.411, "step": 16126 }, { "epoch": 2.98, "learning_rate": 1.5448165410247851e-09, "loss": 0.3917, "step": 16127 }, { "epoch": 2.98, "learning_rate": 1.5099074383317924e-09, "loss": 0.415, "step": 16128 }, { "epoch": 2.98, "learning_rate": 1.4753972568803953e-09, "loss": 0.4029, "step": 16129 }, { "epoch": 2.98, "learning_rate": 1.441285998050601e-09, "loss": 0.3942, "step": 16130 }, { "epoch": 2.98, "learning_rate": 1.4075736632002124e-09, "loss": 0.3823, "step": 16131 }, { "epoch": 2.98, "learning_rate": 1.3742602536759297e-09, "loss": 0.4282, "step": 16132 }, { "epoch": 2.98, "learning_rate": 1.3413457708078003e-09, "loss": 0.4167, "step": 16133 }, { "epoch": 2.99, "learning_rate": 1.3088302159069977e-09, "loss": 0.4164, "step": 16134 }, { "epoch": 2.99, "learning_rate": 1.2767135902713724e-09, "loss": 0.3882, "step": 16135 }, { "epoch": 2.99, "learning_rate": 1.244995895183232e-09, "loss": 0.4158, "step": 16136 }, { "epoch": 2.99, "learning_rate": 1.2136771319082307e-09, "loss": 0.4361, "step": 16137 }, { "epoch": 2.99, "learning_rate": 1.1827573016942596e-09, "loss": 0.4093, "step": 16138 }, { "epoch": 2.99, "learning_rate": 1.1522364057769963e-09, "loss": 0.4122, "step": 16139 }, { "epoch": 2.99, "learning_rate": 1.1221144453721355e-09, "loss": 0.3995, "step": 16140 }, { "epoch": 2.99, "learning_rate": 1.0923914216831588e-09, "loss": 0.4106, "step": 16141 }, { "epoch": 2.99, "learning_rate": 1.0630673358946742e-09, "loss": 0.3938, "step": 16142 }, { "epoch": 2.99, "learning_rate": 1.0341421891779669e-09, "loss": 0.4206, "step": 16143 }, { "epoch": 2.99, "learning_rate": 1.0056159826854484e-09, "loss": 0.4022, "step": 16144 }, { "epoch": 2.99, "learning_rate": 9.774887175562076e-10, "loss": 0.4105, "step": 16145 }, { "epoch": 2.99, "learning_rate": 9.4976039491379e-10, "loss": 0.4019, "step": 16146 }, { "epoch": 2.99, "learning_rate": 9.224310158617578e-10, "loss": 0.3989, "step": 16147 }, { "epoch": 2.99, "learning_rate": 8.955005814925699e-10, "loss": 0.4153, "step": 16148 }, { "epoch": 2.99, "learning_rate": 8.689690928798123e-10, "loss": 0.4062, "step": 16149 }, { "epoch": 2.99, "learning_rate": 8.428365510826376e-10, "loss": 0.4143, "step": 16150 }, { "epoch": 2.99, "learning_rate": 8.171029571435451e-10, "loss": 0.4213, "step": 16151 }, { "epoch": 2.99, "learning_rate": 7.917683120883812e-10, "loss": 0.4015, "step": 16152 }, { "epoch": 2.99, "learning_rate": 7.668326169296692e-10, "loss": 0.4155, "step": 16153 }, { "epoch": 2.99, "learning_rate": 7.422958726599483e-10, "loss": 0.404, "step": 16154 }, { "epoch": 2.99, "learning_rate": 7.181580802606558e-10, "loss": 0.411, "step": 16155 }, { "epoch": 2.99, "learning_rate": 6.944192406932449e-10, "loss": 0.4144, "step": 16156 }, { "epoch": 2.99, "learning_rate": 6.710793549047356e-10, "loss": 0.4002, "step": 16157 }, { "epoch": 2.99, "learning_rate": 6.481384238277155e-10, "loss": 0.4217, "step": 16158 }, { "epoch": 2.99, "learning_rate": 6.255964483758981e-10, "loss": 0.3986, "step": 16159 }, { "epoch": 2.99, "learning_rate": 6.034534294496742e-10, "loss": 0.4172, "step": 16160 }, { "epoch": 2.99, "learning_rate": 5.817093679327812e-10, "loss": 0.4123, "step": 16161 }, { "epoch": 2.99, "learning_rate": 5.603642646911933e-10, "loss": 0.4215, "step": 16162 }, { "epoch": 2.99, "learning_rate": 5.39418120578672e-10, "loss": 0.41, "step": 16163 }, { "epoch": 2.99, "learning_rate": 5.188709364289945e-10, "loss": 0.4153, "step": 16164 }, { "epoch": 2.99, "learning_rate": 4.987227130637262e-10, "loss": 0.4036, "step": 16165 }, { "epoch": 2.99, "learning_rate": 4.789734512855582e-10, "loss": 0.4064, "step": 16166 }, { "epoch": 2.99, "learning_rate": 4.5962315188274877e-10, "loss": 0.4055, "step": 16167 }, { "epoch": 2.99, "learning_rate": 4.40671815626903e-10, "loss": 0.4086, "step": 16168 }, { "epoch": 2.99, "learning_rate": 4.2211944327519297e-10, "loss": 0.4475, "step": 16169 }, { "epoch": 2.99, "learning_rate": 4.03966035565917e-10, "loss": 0.4154, "step": 16170 }, { "epoch": 2.99, "learning_rate": 3.862115932262711e-10, "loss": 0.4245, "step": 16171 }, { "epoch": 2.99, "learning_rate": 3.6885611696235724e-10, "loss": 0.4335, "step": 16172 }, { "epoch": 2.99, "learning_rate": 3.518996074669545e-10, "loss": 0.4225, "step": 16173 }, { "epoch": 2.99, "learning_rate": 3.3534206541729897e-10, "loss": 0.4124, "step": 16174 }, { "epoch": 2.99, "learning_rate": 3.191834914728631e-10, "loss": 0.4176, "step": 16175 }, { "epoch": 2.99, "learning_rate": 3.034238862797967e-10, "loss": 0.398, "step": 16176 }, { "epoch": 2.99, "learning_rate": 2.8806325046648596e-10, "loss": 0.3896, "step": 16177 }, { "epoch": 2.99, "learning_rate": 2.7310158464466383e-10, "loss": 0.4246, "step": 16178 }, { "epoch": 2.99, "learning_rate": 2.585388894127405e-10, "loss": 0.4204, "step": 16179 }, { "epoch": 2.99, "learning_rate": 2.443751653502524e-10, "loss": 0.3949, "step": 16180 }, { "epoch": 2.99, "learning_rate": 2.3061041302341326e-10, "loss": 0.3965, "step": 16181 }, { "epoch": 2.99, "learning_rate": 2.1724463298178344e-10, "loss": 0.4147, "step": 16182 }, { "epoch": 2.99, "learning_rate": 2.0427782575715982e-10, "loss": 0.4125, "step": 16183 }, { "epoch": 2.99, "learning_rate": 1.9170999186801653e-10, "loss": 0.4065, "step": 16184 }, { "epoch": 2.99, "learning_rate": 1.7954113181617437e-10, "loss": 0.4105, "step": 16185 }, { "epoch": 2.99, "learning_rate": 1.6777124608569063e-10, "loss": 0.4147, "step": 16186 }, { "epoch": 2.99, "learning_rate": 1.564003351472998e-10, "loss": 0.4083, "step": 16187 }, { "epoch": 3.0, "learning_rate": 1.4542839945397292e-10, "loss": 0.4075, "step": 16188 }, { "epoch": 3.0, "learning_rate": 1.3485543944424805e-10, "loss": 0.4143, "step": 16189 }, { "epoch": 3.0, "learning_rate": 1.2468145553889976e-10, "loss": 0.4313, "step": 16190 }, { "epoch": 3.0, "learning_rate": 1.1490644814537987e-10, "loss": 0.4298, "step": 16191 }, { "epoch": 3.0, "learning_rate": 1.0553041765226646e-10, "loss": 0.3925, "step": 16192 }, { "epoch": 3.0, "learning_rate": 9.655336443370467e-11, "loss": 0.4001, "step": 16193 }, { "epoch": 3.0, "learning_rate": 8.797528884940676e-11, "loss": 0.4039, "step": 16194 }, { "epoch": 3.0, "learning_rate": 7.979619124021121e-11, "loss": 0.4177, "step": 16195 }, { "epoch": 3.0, "learning_rate": 7.201607193252358e-11, "loss": 0.4121, "step": 16196 }, { "epoch": 3.0, "learning_rate": 6.463493123720632e-11, "loss": 0.4066, "step": 16197 }, { "epoch": 3.0, "learning_rate": 5.7652769448468537e-11, "loss": 0.3981, "step": 16198 }, { "epoch": 3.0, "learning_rate": 5.1069586844976206e-11, "loss": 0.4085, "step": 16199 }, { "epoch": 3.0, "learning_rate": 4.4885383688741956e-11, "loss": 0.4334, "step": 16200 }, { "epoch": 3.0, "learning_rate": 3.910016022845575e-11, "loss": 0.4309, "step": 16201 }, { "epoch": 3.0, "learning_rate": 3.371391669282353e-11, "loss": 0.4215, "step": 16202 }, { "epoch": 3.0, "learning_rate": 2.8726653297228568e-11, "loss": 0.412, "step": 16203 }, { "epoch": 3.0, "learning_rate": 2.4138370241511e-11, "loss": 0.4253, "step": 16204 }, { "epoch": 3.0, "learning_rate": 1.9949067707747404e-11, "loss": 0.4095, "step": 16205 }, { "epoch": 3.0, "learning_rate": 1.615874586469168e-11, "loss": 0.4154, "step": 16206 }, { "epoch": 3.0, "learning_rate": 1.2767404861113719e-11, "loss": 0.3928, "step": 16207 }, { "epoch": 3.0, "learning_rate": 9.775044834681169e-12, "loss": 0.4127, "step": 16208 }, { "epoch": 3.0, "learning_rate": 7.1816659030776726e-12, "loss": 0.4167, "step": 16209 }, { "epoch": 3.0, "learning_rate": 4.987268170664195e-12, "loss": 0.4077, "step": 16210 }, { "epoch": 3.0, "learning_rate": 3.191851725148354e-12, "loss": 0.4205, "step": 16211 }, { "epoch": 3.0, "learning_rate": 1.795416636474201e-12, "loss": 0.404, "step": 16212 }, { "epoch": 3.0, "learning_rate": 7.979629634835562e-13, "loss": 0.4252, "step": 16213 }, { "epoch": 3.0, "learning_rate": 1.9949074281377934e-13, "loss": 0.4459, "step": 16214 }, { "epoch": 3.0, "learning_rate": 0.0, "loss": 0.4133, "step": 16215 }, { "epoch": 3.0, "step": 16215, "total_flos": 1.3493623993143394e+19, "train_loss": 0.4557394363484631, "train_runtime": 35061.5687, "train_samples_per_second": 14.798, "train_steps_per_second": 0.462 } ], "logging_steps": 1.0, "max_steps": 16215, "num_input_tokens_seen": 0, "num_train_epochs": 3, "save_steps": 1000, "total_flos": 1.3493623993143394e+19, "train_batch_size": 4, "trial_name": null, "trial_params": null }