{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.0, "eval_steps": 500, "global_step": 8750, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 7.604562737642586e-08, "loss": 0.8388, "step": 1 }, { "epoch": 0.0, "learning_rate": 1.5209125475285173e-07, "loss": 0.8142, "step": 2 }, { "epoch": 0.0, "learning_rate": 2.281368821292776e-07, "loss": 0.8402, "step": 3 }, { "epoch": 0.0, "learning_rate": 3.0418250950570346e-07, "loss": 0.808, "step": 4 }, { "epoch": 0.0, "learning_rate": 3.802281368821293e-07, "loss": 0.8206, "step": 5 }, { "epoch": 0.0, "learning_rate": 4.562737642585552e-07, "loss": 0.8594, "step": 6 }, { "epoch": 0.0, "learning_rate": 5.32319391634981e-07, "loss": 0.8293, "step": 7 }, { "epoch": 0.0, "learning_rate": 6.083650190114069e-07, "loss": 0.8594, "step": 8 }, { "epoch": 0.0, "learning_rate": 6.844106463878328e-07, "loss": 0.8089, "step": 9 }, { "epoch": 0.0, "learning_rate": 7.604562737642586e-07, "loss": 0.8156, "step": 10 }, { "epoch": 0.0, "learning_rate": 8.365019011406844e-07, "loss": 0.8078, "step": 11 }, { "epoch": 0.0, "learning_rate": 9.125475285171104e-07, "loss": 0.7722, "step": 12 }, { "epoch": 0.0, "learning_rate": 9.885931558935361e-07, "loss": 0.799, "step": 13 }, { "epoch": 0.0, "learning_rate": 1.064638783269962e-06, "loss": 0.8171, "step": 14 }, { "epoch": 0.0, "learning_rate": 1.140684410646388e-06, "loss": 0.7761, "step": 15 }, { "epoch": 0.0, "learning_rate": 1.2167300380228138e-06, "loss": 0.7554, "step": 16 }, { "epoch": 0.0, "learning_rate": 1.2927756653992395e-06, "loss": 0.7353, "step": 17 }, { "epoch": 0.0, "learning_rate": 1.3688212927756656e-06, "loss": 0.7562, "step": 18 }, { "epoch": 0.0, "learning_rate": 1.4448669201520913e-06, "loss": 0.7364, "step": 19 }, { "epoch": 0.0, "learning_rate": 1.5209125475285172e-06, "loss": 0.7192, "step": 20 }, { "epoch": 0.0, "learning_rate": 1.5969581749049431e-06, "loss": 0.7345, "step": 21 }, { "epoch": 0.0, "learning_rate": 1.6730038022813688e-06, "loss": 0.704, "step": 22 }, { "epoch": 0.0, "learning_rate": 1.7490494296577947e-06, "loss": 0.6885, "step": 23 }, { "epoch": 0.0, "learning_rate": 1.8250950570342208e-06, "loss": 0.6952, "step": 24 }, { "epoch": 0.0, "learning_rate": 1.9011406844106463e-06, "loss": 0.679, "step": 25 }, { "epoch": 0.0, "learning_rate": 1.9771863117870722e-06, "loss": 0.6861, "step": 26 }, { "epoch": 0.0, "learning_rate": 2.053231939163498e-06, "loss": 0.6799, "step": 27 }, { "epoch": 0.0, "learning_rate": 2.129277566539924e-06, "loss": 0.669, "step": 28 }, { "epoch": 0.0, "learning_rate": 2.20532319391635e-06, "loss": 0.6709, "step": 29 }, { "epoch": 0.0, "learning_rate": 2.281368821292776e-06, "loss": 0.6729, "step": 30 }, { "epoch": 0.0, "learning_rate": 2.3574144486692017e-06, "loss": 0.6522, "step": 31 }, { "epoch": 0.0, "learning_rate": 2.4334600760456276e-06, "loss": 0.6696, "step": 32 }, { "epoch": 0.0, "learning_rate": 2.509505703422053e-06, "loss": 0.6507, "step": 33 }, { "epoch": 0.0, "learning_rate": 2.585551330798479e-06, "loss": 0.6338, "step": 34 }, { "epoch": 0.0, "learning_rate": 2.6615969581749054e-06, "loss": 0.6667, "step": 35 }, { "epoch": 0.0, "learning_rate": 2.7376425855513313e-06, "loss": 0.6551, "step": 36 }, { "epoch": 0.0, "learning_rate": 2.813688212927757e-06, "loss": 0.6158, "step": 37 }, { "epoch": 0.0, "learning_rate": 2.8897338403041826e-06, "loss": 0.6222, "step": 38 }, { "epoch": 0.0, "learning_rate": 2.9657794676806085e-06, "loss": 0.628, "step": 39 }, { "epoch": 0.0, "learning_rate": 3.0418250950570345e-06, "loss": 0.6507, "step": 40 }, { "epoch": 0.0, "learning_rate": 3.1178707224334604e-06, "loss": 0.6518, "step": 41 }, { "epoch": 0.0, "learning_rate": 3.1939163498098863e-06, "loss": 0.6297, "step": 42 }, { "epoch": 0.0, "learning_rate": 3.269961977186312e-06, "loss": 0.6228, "step": 43 }, { "epoch": 0.01, "learning_rate": 3.3460076045627376e-06, "loss": 0.6278, "step": 44 }, { "epoch": 0.01, "learning_rate": 3.4220532319391635e-06, "loss": 0.6226, "step": 45 }, { "epoch": 0.01, "learning_rate": 3.4980988593155894e-06, "loss": 0.6057, "step": 46 }, { "epoch": 0.01, "learning_rate": 3.5741444866920154e-06, "loss": 0.6189, "step": 47 }, { "epoch": 0.01, "learning_rate": 3.6501901140684417e-06, "loss": 0.6293, "step": 48 }, { "epoch": 0.01, "learning_rate": 3.7262357414448676e-06, "loss": 0.6231, "step": 49 }, { "epoch": 0.01, "learning_rate": 3.8022813688212926e-06, "loss": 0.629, "step": 50 }, { "epoch": 0.01, "learning_rate": 3.8783269961977185e-06, "loss": 0.6011, "step": 51 }, { "epoch": 0.01, "learning_rate": 3.9543726235741444e-06, "loss": 0.6084, "step": 52 }, { "epoch": 0.01, "learning_rate": 4.03041825095057e-06, "loss": 0.5854, "step": 53 }, { "epoch": 0.01, "learning_rate": 4.106463878326996e-06, "loss": 0.6004, "step": 54 }, { "epoch": 0.01, "learning_rate": 4.182509505703423e-06, "loss": 0.5955, "step": 55 }, { "epoch": 0.01, "learning_rate": 4.258555133079848e-06, "loss": 0.6117, "step": 56 }, { "epoch": 0.01, "learning_rate": 4.334600760456274e-06, "loss": 0.5993, "step": 57 }, { "epoch": 0.01, "learning_rate": 4.4106463878327e-06, "loss": 0.6063, "step": 58 }, { "epoch": 0.01, "learning_rate": 4.486692015209126e-06, "loss": 0.5858, "step": 59 }, { "epoch": 0.01, "learning_rate": 4.562737642585552e-06, "loss": 0.6101, "step": 60 }, { "epoch": 0.01, "learning_rate": 4.638783269961978e-06, "loss": 0.5843, "step": 61 }, { "epoch": 0.01, "learning_rate": 4.7148288973384035e-06, "loss": 0.5875, "step": 62 }, { "epoch": 0.01, "learning_rate": 4.790874524714829e-06, "loss": 0.5833, "step": 63 }, { "epoch": 0.01, "learning_rate": 4.866920152091255e-06, "loss": 0.5843, "step": 64 }, { "epoch": 0.01, "learning_rate": 4.942965779467681e-06, "loss": 0.5836, "step": 65 }, { "epoch": 0.01, "learning_rate": 5.019011406844106e-06, "loss": 0.6352, "step": 66 }, { "epoch": 0.01, "learning_rate": 5.095057034220533e-06, "loss": 0.5787, "step": 67 }, { "epoch": 0.01, "learning_rate": 5.171102661596958e-06, "loss": 0.59, "step": 68 }, { "epoch": 0.01, "learning_rate": 5.247148288973385e-06, "loss": 0.5917, "step": 69 }, { "epoch": 0.01, "learning_rate": 5.323193916349811e-06, "loss": 0.5731, "step": 70 }, { "epoch": 0.01, "learning_rate": 5.399239543726236e-06, "loss": 0.5789, "step": 71 }, { "epoch": 0.01, "learning_rate": 5.4752851711026625e-06, "loss": 0.581, "step": 72 }, { "epoch": 0.01, "learning_rate": 5.5513307984790876e-06, "loss": 0.5857, "step": 73 }, { "epoch": 0.01, "learning_rate": 5.627376425855514e-06, "loss": 0.5863, "step": 74 }, { "epoch": 0.01, "learning_rate": 5.703422053231939e-06, "loss": 0.5802, "step": 75 }, { "epoch": 0.01, "learning_rate": 5.779467680608365e-06, "loss": 0.5812, "step": 76 }, { "epoch": 0.01, "learning_rate": 5.855513307984791e-06, "loss": 0.5775, "step": 77 }, { "epoch": 0.01, "learning_rate": 5.931558935361217e-06, "loss": 0.5732, "step": 78 }, { "epoch": 0.01, "learning_rate": 6.007604562737643e-06, "loss": 0.5573, "step": 79 }, { "epoch": 0.01, "learning_rate": 6.083650190114069e-06, "loss": 0.5563, "step": 80 }, { "epoch": 0.01, "learning_rate": 6.159695817490496e-06, "loss": 0.5797, "step": 81 }, { "epoch": 0.01, "learning_rate": 6.235741444866921e-06, "loss": 0.5945, "step": 82 }, { "epoch": 0.01, "learning_rate": 6.311787072243346e-06, "loss": 0.5757, "step": 83 }, { "epoch": 0.01, "learning_rate": 6.3878326996197725e-06, "loss": 0.569, "step": 84 }, { "epoch": 0.01, "learning_rate": 6.4638783269961976e-06, "loss": 0.5691, "step": 85 }, { "epoch": 0.01, "learning_rate": 6.539923954372624e-06, "loss": 0.5818, "step": 86 }, { "epoch": 0.01, "learning_rate": 6.61596958174905e-06, "loss": 0.5869, "step": 87 }, { "epoch": 0.01, "learning_rate": 6.692015209125475e-06, "loss": 0.5624, "step": 88 }, { "epoch": 0.01, "learning_rate": 6.768060836501902e-06, "loss": 0.561, "step": 89 }, { "epoch": 0.01, "learning_rate": 6.844106463878327e-06, "loss": 0.5586, "step": 90 }, { "epoch": 0.01, "learning_rate": 6.920152091254754e-06, "loss": 0.585, "step": 91 }, { "epoch": 0.01, "learning_rate": 6.996197718631179e-06, "loss": 0.575, "step": 92 }, { "epoch": 0.01, "learning_rate": 7.072243346007606e-06, "loss": 0.5674, "step": 93 }, { "epoch": 0.01, "learning_rate": 7.148288973384031e-06, "loss": 0.5803, "step": 94 }, { "epoch": 0.01, "learning_rate": 7.224334600760457e-06, "loss": 0.5745, "step": 95 }, { "epoch": 0.01, "learning_rate": 7.300380228136883e-06, "loss": 0.5678, "step": 96 }, { "epoch": 0.01, "learning_rate": 7.376425855513308e-06, "loss": 0.5495, "step": 97 }, { "epoch": 0.01, "learning_rate": 7.452471482889735e-06, "loss": 0.5583, "step": 98 }, { "epoch": 0.01, "learning_rate": 7.52851711026616e-06, "loss": 0.5921, "step": 99 }, { "epoch": 0.01, "learning_rate": 7.604562737642585e-06, "loss": 0.564, "step": 100 }, { "epoch": 0.01, "learning_rate": 7.680608365019012e-06, "loss": 0.5552, "step": 101 }, { "epoch": 0.01, "learning_rate": 7.756653992395437e-06, "loss": 0.5649, "step": 102 }, { "epoch": 0.01, "learning_rate": 7.832699619771864e-06, "loss": 0.5691, "step": 103 }, { "epoch": 0.01, "learning_rate": 7.908745247148289e-06, "loss": 0.5722, "step": 104 }, { "epoch": 0.01, "learning_rate": 7.984790874524716e-06, "loss": 0.5691, "step": 105 }, { "epoch": 0.01, "learning_rate": 8.06083650190114e-06, "loss": 0.5728, "step": 106 }, { "epoch": 0.01, "learning_rate": 8.136882129277567e-06, "loss": 0.5799, "step": 107 }, { "epoch": 0.01, "learning_rate": 8.212927756653993e-06, "loss": 0.5636, "step": 108 }, { "epoch": 0.01, "learning_rate": 8.28897338403042e-06, "loss": 0.5666, "step": 109 }, { "epoch": 0.01, "learning_rate": 8.365019011406846e-06, "loss": 0.5627, "step": 110 }, { "epoch": 0.01, "learning_rate": 8.441064638783271e-06, "loss": 0.5494, "step": 111 }, { "epoch": 0.01, "learning_rate": 8.517110266159696e-06, "loss": 0.5716, "step": 112 }, { "epoch": 0.01, "learning_rate": 8.593155893536123e-06, "loss": 0.5442, "step": 113 }, { "epoch": 0.01, "learning_rate": 8.669201520912548e-06, "loss": 0.5698, "step": 114 }, { "epoch": 0.01, "learning_rate": 8.745247148288975e-06, "loss": 0.5592, "step": 115 }, { "epoch": 0.01, "learning_rate": 8.8212927756654e-06, "loss": 0.5573, "step": 116 }, { "epoch": 0.01, "learning_rate": 8.897338403041825e-06, "loss": 0.5634, "step": 117 }, { "epoch": 0.01, "learning_rate": 8.973384030418252e-06, "loss": 0.5451, "step": 118 }, { "epoch": 0.01, "learning_rate": 9.049429657794677e-06, "loss": 0.5629, "step": 119 }, { "epoch": 0.01, "learning_rate": 9.125475285171103e-06, "loss": 0.5551, "step": 120 }, { "epoch": 0.01, "learning_rate": 9.201520912547528e-06, "loss": 0.547, "step": 121 }, { "epoch": 0.01, "learning_rate": 9.277566539923955e-06, "loss": 0.5649, "step": 122 }, { "epoch": 0.01, "learning_rate": 9.35361216730038e-06, "loss": 0.5516, "step": 123 }, { "epoch": 0.01, "learning_rate": 9.429657794676807e-06, "loss": 0.5661, "step": 124 }, { "epoch": 0.01, "learning_rate": 9.505703422053234e-06, "loss": 0.5619, "step": 125 }, { "epoch": 0.01, "learning_rate": 9.581749049429659e-06, "loss": 0.5714, "step": 126 }, { "epoch": 0.01, "learning_rate": 9.657794676806086e-06, "loss": 0.5372, "step": 127 }, { "epoch": 0.01, "learning_rate": 9.73384030418251e-06, "loss": 0.5492, "step": 128 }, { "epoch": 0.01, "learning_rate": 9.809885931558936e-06, "loss": 0.5402, "step": 129 }, { "epoch": 0.01, "learning_rate": 9.885931558935362e-06, "loss": 0.5687, "step": 130 }, { "epoch": 0.01, "learning_rate": 9.961977186311787e-06, "loss": 0.5433, "step": 131 }, { "epoch": 0.02, "learning_rate": 1.0038022813688212e-05, "loss": 0.5584, "step": 132 }, { "epoch": 0.02, "learning_rate": 1.011406844106464e-05, "loss": 0.5561, "step": 133 }, { "epoch": 0.02, "learning_rate": 1.0190114068441066e-05, "loss": 0.5563, "step": 134 }, { "epoch": 0.02, "learning_rate": 1.0266159695817491e-05, "loss": 0.5626, "step": 135 }, { "epoch": 0.02, "learning_rate": 1.0342205323193916e-05, "loss": 0.5659, "step": 136 }, { "epoch": 0.02, "learning_rate": 1.0418250950570343e-05, "loss": 0.516, "step": 137 }, { "epoch": 0.02, "learning_rate": 1.049429657794677e-05, "loss": 0.5602, "step": 138 }, { "epoch": 0.02, "learning_rate": 1.0570342205323195e-05, "loss": 0.553, "step": 139 }, { "epoch": 0.02, "learning_rate": 1.0646387832699621e-05, "loss": 0.5562, "step": 140 }, { "epoch": 0.02, "learning_rate": 1.0722433460076046e-05, "loss": 0.5302, "step": 141 }, { "epoch": 0.02, "learning_rate": 1.0798479087452472e-05, "loss": 0.561, "step": 142 }, { "epoch": 0.02, "learning_rate": 1.0874524714828898e-05, "loss": 0.5463, "step": 143 }, { "epoch": 0.02, "learning_rate": 1.0950570342205325e-05, "loss": 0.5567, "step": 144 }, { "epoch": 0.02, "learning_rate": 1.1026615969581752e-05, "loss": 0.5301, "step": 145 }, { "epoch": 0.02, "learning_rate": 1.1102661596958175e-05, "loss": 0.5499, "step": 146 }, { "epoch": 0.02, "learning_rate": 1.1178707224334602e-05, "loss": 0.5371, "step": 147 }, { "epoch": 0.02, "learning_rate": 1.1254752851711029e-05, "loss": 0.5385, "step": 148 }, { "epoch": 0.02, "learning_rate": 1.1330798479087452e-05, "loss": 0.5438, "step": 149 }, { "epoch": 0.02, "learning_rate": 1.1406844106463879e-05, "loss": 0.5507, "step": 150 }, { "epoch": 0.02, "learning_rate": 1.1482889733840306e-05, "loss": 0.5496, "step": 151 }, { "epoch": 0.02, "learning_rate": 1.155893536121673e-05, "loss": 0.5411, "step": 152 }, { "epoch": 0.02, "learning_rate": 1.1634980988593156e-05, "loss": 0.5492, "step": 153 }, { "epoch": 0.02, "learning_rate": 1.1711026615969582e-05, "loss": 0.5384, "step": 154 }, { "epoch": 0.02, "learning_rate": 1.1787072243346009e-05, "loss": 0.5209, "step": 155 }, { "epoch": 0.02, "learning_rate": 1.1863117870722434e-05, "loss": 0.5404, "step": 156 }, { "epoch": 0.02, "learning_rate": 1.1939163498098861e-05, "loss": 0.5511, "step": 157 }, { "epoch": 0.02, "learning_rate": 1.2015209125475286e-05, "loss": 0.53, "step": 158 }, { "epoch": 0.02, "learning_rate": 1.2091254752851711e-05, "loss": 0.5369, "step": 159 }, { "epoch": 0.02, "learning_rate": 1.2167300380228138e-05, "loss": 0.5446, "step": 160 }, { "epoch": 0.02, "learning_rate": 1.2243346007604565e-05, "loss": 0.5408, "step": 161 }, { "epoch": 0.02, "learning_rate": 1.2319391634980991e-05, "loss": 0.5411, "step": 162 }, { "epoch": 0.02, "learning_rate": 1.2395437262357415e-05, "loss": 0.5167, "step": 163 }, { "epoch": 0.02, "learning_rate": 1.2471482889733841e-05, "loss": 0.5447, "step": 164 }, { "epoch": 0.02, "learning_rate": 1.2547528517110268e-05, "loss": 0.5221, "step": 165 }, { "epoch": 0.02, "learning_rate": 1.2623574144486692e-05, "loss": 0.536, "step": 166 }, { "epoch": 0.02, "learning_rate": 1.2699619771863118e-05, "loss": 0.5453, "step": 167 }, { "epoch": 0.02, "learning_rate": 1.2775665399239545e-05, "loss": 0.531, "step": 168 }, { "epoch": 0.02, "learning_rate": 1.2851711026615972e-05, "loss": 0.5511, "step": 169 }, { "epoch": 0.02, "learning_rate": 1.2927756653992395e-05, "loss": 0.5444, "step": 170 }, { "epoch": 0.02, "learning_rate": 1.3003802281368822e-05, "loss": 0.5562, "step": 171 }, { "epoch": 0.02, "learning_rate": 1.3079847908745249e-05, "loss": 0.5343, "step": 172 }, { "epoch": 0.02, "learning_rate": 1.3155893536121674e-05, "loss": 0.5298, "step": 173 }, { "epoch": 0.02, "learning_rate": 1.32319391634981e-05, "loss": 0.5133, "step": 174 }, { "epoch": 0.02, "learning_rate": 1.3307984790874526e-05, "loss": 0.5407, "step": 175 }, { "epoch": 0.02, "learning_rate": 1.338403041825095e-05, "loss": 0.5446, "step": 176 }, { "epoch": 0.02, "learning_rate": 1.3460076045627377e-05, "loss": 0.5178, "step": 177 }, { "epoch": 0.02, "learning_rate": 1.3536121673003804e-05, "loss": 0.5481, "step": 178 }, { "epoch": 0.02, "learning_rate": 1.361216730038023e-05, "loss": 0.5537, "step": 179 }, { "epoch": 0.02, "learning_rate": 1.3688212927756654e-05, "loss": 0.5121, "step": 180 }, { "epoch": 0.02, "learning_rate": 1.3764258555133081e-05, "loss": 0.5132, "step": 181 }, { "epoch": 0.02, "learning_rate": 1.3840304182509508e-05, "loss": 0.5489, "step": 182 }, { "epoch": 0.02, "learning_rate": 1.3916349809885931e-05, "loss": 0.5299, "step": 183 }, { "epoch": 0.02, "learning_rate": 1.3992395437262358e-05, "loss": 0.5523, "step": 184 }, { "epoch": 0.02, "learning_rate": 1.4068441064638785e-05, "loss": 0.5257, "step": 185 }, { "epoch": 0.02, "learning_rate": 1.4144486692015211e-05, "loss": 0.5232, "step": 186 }, { "epoch": 0.02, "learning_rate": 1.4220532319391636e-05, "loss": 0.5423, "step": 187 }, { "epoch": 0.02, "learning_rate": 1.4296577946768061e-05, "loss": 0.528, "step": 188 }, { "epoch": 0.02, "learning_rate": 1.4372623574144488e-05, "loss": 0.527, "step": 189 }, { "epoch": 0.02, "learning_rate": 1.4448669201520913e-05, "loss": 0.5425, "step": 190 }, { "epoch": 0.02, "learning_rate": 1.452471482889734e-05, "loss": 0.5182, "step": 191 }, { "epoch": 0.02, "learning_rate": 1.4600760456273767e-05, "loss": 0.5552, "step": 192 }, { "epoch": 0.02, "learning_rate": 1.467680608365019e-05, "loss": 0.5517, "step": 193 }, { "epoch": 0.02, "learning_rate": 1.4752851711026617e-05, "loss": 0.5179, "step": 194 }, { "epoch": 0.02, "learning_rate": 1.4828897338403044e-05, "loss": 0.5453, "step": 195 }, { "epoch": 0.02, "learning_rate": 1.490494296577947e-05, "loss": 0.5325, "step": 196 }, { "epoch": 0.02, "learning_rate": 1.4980988593155894e-05, "loss": 0.5305, "step": 197 }, { "epoch": 0.02, "learning_rate": 1.505703422053232e-05, "loss": 0.5312, "step": 198 }, { "epoch": 0.02, "learning_rate": 1.5133079847908747e-05, "loss": 0.5371, "step": 199 }, { "epoch": 0.02, "learning_rate": 1.520912547528517e-05, "loss": 0.5374, "step": 200 }, { "epoch": 0.02, "learning_rate": 1.5285171102661597e-05, "loss": 0.537, "step": 201 }, { "epoch": 0.02, "learning_rate": 1.5361216730038024e-05, "loss": 0.5428, "step": 202 }, { "epoch": 0.02, "learning_rate": 1.543726235741445e-05, "loss": 0.5202, "step": 203 }, { "epoch": 0.02, "learning_rate": 1.5513307984790874e-05, "loss": 0.5168, "step": 204 }, { "epoch": 0.02, "learning_rate": 1.55893536121673e-05, "loss": 0.5479, "step": 205 }, { "epoch": 0.02, "learning_rate": 1.5665399239543728e-05, "loss": 0.5294, "step": 206 }, { "epoch": 0.02, "learning_rate": 1.574144486692015e-05, "loss": 0.535, "step": 207 }, { "epoch": 0.02, "learning_rate": 1.5817490494296578e-05, "loss": 0.5417, "step": 208 }, { "epoch": 0.02, "learning_rate": 1.5893536121673005e-05, "loss": 0.5564, "step": 209 }, { "epoch": 0.02, "learning_rate": 1.596958174904943e-05, "loss": 0.5247, "step": 210 }, { "epoch": 0.02, "learning_rate": 1.6045627376425855e-05, "loss": 0.5157, "step": 211 }, { "epoch": 0.02, "learning_rate": 1.612167300380228e-05, "loss": 0.5206, "step": 212 }, { "epoch": 0.02, "learning_rate": 1.6197718631178708e-05, "loss": 0.5466, "step": 213 }, { "epoch": 0.02, "learning_rate": 1.6273764258555135e-05, "loss": 0.5188, "step": 214 }, { "epoch": 0.02, "learning_rate": 1.634980988593156e-05, "loss": 0.5301, "step": 215 }, { "epoch": 0.02, "learning_rate": 1.6425855513307985e-05, "loss": 0.5417, "step": 216 }, { "epoch": 0.02, "learning_rate": 1.6501901140684412e-05, "loss": 0.5318, "step": 217 }, { "epoch": 0.02, "learning_rate": 1.657794676806084e-05, "loss": 0.5161, "step": 218 }, { "epoch": 0.03, "learning_rate": 1.6653992395437265e-05, "loss": 0.5379, "step": 219 }, { "epoch": 0.03, "learning_rate": 1.6730038022813692e-05, "loss": 0.5216, "step": 220 }, { "epoch": 0.03, "learning_rate": 1.6806083650190115e-05, "loss": 0.5264, "step": 221 }, { "epoch": 0.03, "learning_rate": 1.6882129277566542e-05, "loss": 0.5262, "step": 222 }, { "epoch": 0.03, "learning_rate": 1.695817490494297e-05, "loss": 0.5251, "step": 223 }, { "epoch": 0.03, "learning_rate": 1.7034220532319392e-05, "loss": 0.5259, "step": 224 }, { "epoch": 0.03, "learning_rate": 1.711026615969582e-05, "loss": 0.5346, "step": 225 }, { "epoch": 0.03, "learning_rate": 1.7186311787072246e-05, "loss": 0.5362, "step": 226 }, { "epoch": 0.03, "learning_rate": 1.7262357414448672e-05, "loss": 0.5164, "step": 227 }, { "epoch": 0.03, "learning_rate": 1.7338403041825096e-05, "loss": 0.5233, "step": 228 }, { "epoch": 0.03, "learning_rate": 1.7414448669201523e-05, "loss": 0.5171, "step": 229 }, { "epoch": 0.03, "learning_rate": 1.749049429657795e-05, "loss": 0.521, "step": 230 }, { "epoch": 0.03, "learning_rate": 1.7566539923954373e-05, "loss": 0.5227, "step": 231 }, { "epoch": 0.03, "learning_rate": 1.76425855513308e-05, "loss": 0.518, "step": 232 }, { "epoch": 0.03, "learning_rate": 1.7718631178707226e-05, "loss": 0.5416, "step": 233 }, { "epoch": 0.03, "learning_rate": 1.779467680608365e-05, "loss": 0.521, "step": 234 }, { "epoch": 0.03, "learning_rate": 1.7870722433460076e-05, "loss": 0.5199, "step": 235 }, { "epoch": 0.03, "learning_rate": 1.7946768060836503e-05, "loss": 0.5327, "step": 236 }, { "epoch": 0.03, "learning_rate": 1.802281368821293e-05, "loss": 0.52, "step": 237 }, { "epoch": 0.03, "learning_rate": 1.8098859315589353e-05, "loss": 0.519, "step": 238 }, { "epoch": 0.03, "learning_rate": 1.817490494296578e-05, "loss": 0.5309, "step": 239 }, { "epoch": 0.03, "learning_rate": 1.8250950570342207e-05, "loss": 0.5213, "step": 240 }, { "epoch": 0.03, "learning_rate": 1.832699619771863e-05, "loss": 0.5349, "step": 241 }, { "epoch": 0.03, "learning_rate": 1.8403041825095057e-05, "loss": 0.5415, "step": 242 }, { "epoch": 0.03, "learning_rate": 1.8479087452471484e-05, "loss": 0.5163, "step": 243 }, { "epoch": 0.03, "learning_rate": 1.855513307984791e-05, "loss": 0.5141, "step": 244 }, { "epoch": 0.03, "learning_rate": 1.8631178707224337e-05, "loss": 0.5208, "step": 245 }, { "epoch": 0.03, "learning_rate": 1.870722433460076e-05, "loss": 0.5091, "step": 246 }, { "epoch": 0.03, "learning_rate": 1.8783269961977187e-05, "loss": 0.5496, "step": 247 }, { "epoch": 0.03, "learning_rate": 1.8859315589353614e-05, "loss": 0.518, "step": 248 }, { "epoch": 0.03, "learning_rate": 1.893536121673004e-05, "loss": 0.5337, "step": 249 }, { "epoch": 0.03, "learning_rate": 1.9011406844106467e-05, "loss": 0.5099, "step": 250 }, { "epoch": 0.03, "learning_rate": 1.908745247148289e-05, "loss": 0.5258, "step": 251 }, { "epoch": 0.03, "learning_rate": 1.9163498098859318e-05, "loss": 0.5225, "step": 252 }, { "epoch": 0.03, "learning_rate": 1.9239543726235744e-05, "loss": 0.5185, "step": 253 }, { "epoch": 0.03, "learning_rate": 1.931558935361217e-05, "loss": 0.527, "step": 254 }, { "epoch": 0.03, "learning_rate": 1.9391634980988594e-05, "loss": 0.5155, "step": 255 }, { "epoch": 0.03, "learning_rate": 1.946768060836502e-05, "loss": 0.5138, "step": 256 }, { "epoch": 0.03, "learning_rate": 1.9543726235741448e-05, "loss": 0.5309, "step": 257 }, { "epoch": 0.03, "learning_rate": 1.961977186311787e-05, "loss": 0.527, "step": 258 }, { "epoch": 0.03, "learning_rate": 1.9695817490494298e-05, "loss": 0.5223, "step": 259 }, { "epoch": 0.03, "learning_rate": 1.9771863117870725e-05, "loss": 0.5452, "step": 260 }, { "epoch": 0.03, "learning_rate": 1.984790874524715e-05, "loss": 0.527, "step": 261 }, { "epoch": 0.03, "learning_rate": 1.9923954372623575e-05, "loss": 0.535, "step": 262 }, { "epoch": 0.03, "learning_rate": 2e-05, "loss": 0.5283, "step": 263 }, { "epoch": 0.03, "learning_rate": 1.9999999314888373e-05, "loss": 0.5108, "step": 264 }, { "epoch": 0.03, "learning_rate": 1.9999997259553572e-05, "loss": 0.5212, "step": 265 }, { "epoch": 0.03, "learning_rate": 1.9999993833995886e-05, "loss": 0.5039, "step": 266 }, { "epoch": 0.03, "learning_rate": 1.9999989038215787e-05, "loss": 0.5497, "step": 267 }, { "epoch": 0.03, "learning_rate": 1.9999982872213925e-05, "loss": 0.5265, "step": 268 }, { "epoch": 0.03, "learning_rate": 1.999997533599115e-05, "loss": 0.5201, "step": 269 }, { "epoch": 0.03, "learning_rate": 1.999996642954849e-05, "loss": 0.5279, "step": 270 }, { "epoch": 0.03, "learning_rate": 1.999995615288717e-05, "loss": 0.5313, "step": 271 }, { "epoch": 0.03, "learning_rate": 1.9999944506008594e-05, "loss": 0.5108, "step": 272 }, { "epoch": 0.03, "learning_rate": 1.9999931488914366e-05, "loss": 0.5274, "step": 273 }, { "epoch": 0.03, "learning_rate": 1.999991710160626e-05, "loss": 0.5071, "step": 274 }, { "epoch": 0.03, "learning_rate": 1.999990134408625e-05, "loss": 0.5226, "step": 275 }, { "epoch": 0.03, "learning_rate": 1.99998842163565e-05, "loss": 0.5201, "step": 276 }, { "epoch": 0.03, "learning_rate": 1.9999865718419352e-05, "loss": 0.5188, "step": 277 }, { "epoch": 0.03, "learning_rate": 1.999984585027734e-05, "loss": 0.5578, "step": 278 }, { "epoch": 0.03, "learning_rate": 1.999982461193319e-05, "loss": 0.5245, "step": 279 }, { "epoch": 0.03, "learning_rate": 1.999980200338981e-05, "loss": 0.5092, "step": 280 }, { "epoch": 0.03, "learning_rate": 1.9999778024650296e-05, "loss": 0.5174, "step": 281 }, { "epoch": 0.03, "learning_rate": 1.9999752675717938e-05, "loss": 0.524, "step": 282 }, { "epoch": 0.03, "learning_rate": 1.9999725956596204e-05, "loss": 0.5193, "step": 283 }, { "epoch": 0.03, "learning_rate": 1.9999697867288764e-05, "loss": 0.5026, "step": 284 }, { "epoch": 0.03, "learning_rate": 1.999966840779946e-05, "loss": 0.527, "step": 285 }, { "epoch": 0.03, "learning_rate": 1.9999637578132328e-05, "loss": 0.5295, "step": 286 }, { "epoch": 0.03, "learning_rate": 1.9999605378291593e-05, "loss": 0.5041, "step": 287 }, { "epoch": 0.03, "learning_rate": 1.999957180828167e-05, "loss": 0.5232, "step": 288 }, { "epoch": 0.03, "learning_rate": 1.999953686810716e-05, "loss": 0.5181, "step": 289 }, { "epoch": 0.03, "learning_rate": 1.9999500557772843e-05, "loss": 0.5092, "step": 290 }, { "epoch": 0.03, "learning_rate": 1.9999462877283702e-05, "loss": 0.5373, "step": 291 }, { "epoch": 0.03, "learning_rate": 1.9999423826644895e-05, "loss": 0.5129, "step": 292 }, { "epoch": 0.03, "learning_rate": 1.999938340586178e-05, "loss": 0.5435, "step": 293 }, { "epoch": 0.03, "learning_rate": 1.999934161493988e-05, "loss": 0.5212, "step": 294 }, { "epoch": 0.03, "learning_rate": 1.9999298453884944e-05, "loss": 0.5404, "step": 295 }, { "epoch": 0.03, "learning_rate": 1.9999253922702868e-05, "loss": 0.5253, "step": 296 }, { "epoch": 0.03, "learning_rate": 1.9999208021399757e-05, "loss": 0.5073, "step": 297 }, { "epoch": 0.03, "learning_rate": 1.9999160749981908e-05, "loss": 0.507, "step": 298 }, { "epoch": 0.03, "learning_rate": 1.999911210845579e-05, "loss": 0.5219, "step": 299 }, { "epoch": 0.03, "learning_rate": 1.9999062096828072e-05, "loss": 0.5168, "step": 300 }, { "epoch": 0.03, "learning_rate": 1.9999010715105608e-05, "loss": 0.5167, "step": 301 }, { "epoch": 0.03, "learning_rate": 1.9998957963295434e-05, "loss": 0.5081, "step": 302 }, { "epoch": 0.03, "learning_rate": 1.999890384140478e-05, "loss": 0.5134, "step": 303 }, { "epoch": 0.03, "learning_rate": 1.999884834944106e-05, "loss": 0.5205, "step": 304 }, { "epoch": 0.03, "learning_rate": 1.9998791487411887e-05, "loss": 0.5281, "step": 305 }, { "epoch": 0.03, "learning_rate": 1.9998733255325043e-05, "loss": 0.5184, "step": 306 }, { "epoch": 0.04, "learning_rate": 1.999867365318851e-05, "loss": 0.509, "step": 307 }, { "epoch": 0.04, "learning_rate": 1.9998612681010452e-05, "loss": 0.5131, "step": 308 }, { "epoch": 0.04, "learning_rate": 1.999855033879923e-05, "loss": 0.5204, "step": 309 }, { "epoch": 0.04, "learning_rate": 1.9998486626563376e-05, "loss": 0.5085, "step": 310 }, { "epoch": 0.04, "learning_rate": 1.999842154431163e-05, "loss": 0.5362, "step": 311 }, { "epoch": 0.04, "learning_rate": 1.9998355092052906e-05, "loss": 0.5136, "step": 312 }, { "epoch": 0.04, "learning_rate": 1.9998287269796313e-05, "loss": 0.5057, "step": 313 }, { "epoch": 0.04, "learning_rate": 1.9998218077551135e-05, "loss": 0.5129, "step": 314 }, { "epoch": 0.04, "learning_rate": 1.9998147515326862e-05, "loss": 0.5301, "step": 315 }, { "epoch": 0.04, "learning_rate": 1.9998075583133157e-05, "loss": 0.4895, "step": 316 }, { "epoch": 0.04, "learning_rate": 1.999800228097988e-05, "loss": 0.5259, "step": 317 }, { "epoch": 0.04, "learning_rate": 1.999792760887707e-05, "loss": 0.5194, "step": 318 }, { "epoch": 0.04, "learning_rate": 1.9997851566834966e-05, "loss": 0.5316, "step": 319 }, { "epoch": 0.04, "learning_rate": 1.999777415486398e-05, "loss": 0.517, "step": 320 }, { "epoch": 0.04, "learning_rate": 1.9997695372974725e-05, "loss": 0.5055, "step": 321 }, { "epoch": 0.04, "learning_rate": 1.9997615221177996e-05, "loss": 0.543, "step": 322 }, { "epoch": 0.04, "learning_rate": 1.999753369948477e-05, "loss": 0.5334, "step": 323 }, { "epoch": 0.04, "learning_rate": 1.999745080790622e-05, "loss": 0.5019, "step": 324 }, { "epoch": 0.04, "learning_rate": 1.999736654645371e-05, "loss": 0.5284, "step": 325 }, { "epoch": 0.04, "learning_rate": 1.999728091513877e-05, "loss": 0.5158, "step": 326 }, { "epoch": 0.04, "learning_rate": 1.9997193913973154e-05, "loss": 0.5483, "step": 327 }, { "epoch": 0.04, "learning_rate": 1.999710554296877e-05, "loss": 0.5111, "step": 328 }, { "epoch": 0.04, "learning_rate": 1.9997015802137727e-05, "loss": 0.5069, "step": 329 }, { "epoch": 0.04, "learning_rate": 1.9996924691492325e-05, "loss": 0.4987, "step": 330 }, { "epoch": 0.04, "learning_rate": 1.9996832211045048e-05, "loss": 0.542, "step": 331 }, { "epoch": 0.04, "learning_rate": 1.9996738360808566e-05, "loss": 0.5133, "step": 332 }, { "epoch": 0.04, "learning_rate": 1.999664314079574e-05, "loss": 0.5189, "step": 333 }, { "epoch": 0.04, "learning_rate": 1.9996546551019618e-05, "loss": 0.4968, "step": 334 }, { "epoch": 0.04, "learning_rate": 1.9996448591493433e-05, "loss": 0.5309, "step": 335 }, { "epoch": 0.04, "learning_rate": 1.9996349262230607e-05, "loss": 0.5144, "step": 336 }, { "epoch": 0.04, "learning_rate": 1.9996248563244755e-05, "loss": 0.5217, "step": 337 }, { "epoch": 0.04, "learning_rate": 1.9996146494549672e-05, "loss": 0.4983, "step": 338 }, { "epoch": 0.04, "learning_rate": 1.999604305615934e-05, "loss": 0.4968, "step": 339 }, { "epoch": 0.04, "learning_rate": 1.9995938248087937e-05, "loss": 0.5185, "step": 340 }, { "epoch": 0.04, "learning_rate": 1.9995832070349827e-05, "loss": 0.4945, "step": 341 }, { "epoch": 0.04, "learning_rate": 1.999572452295955e-05, "loss": 0.5324, "step": 342 }, { "epoch": 0.04, "learning_rate": 1.999561560593185e-05, "loss": 0.5058, "step": 343 }, { "epoch": 0.04, "learning_rate": 1.9995505319281645e-05, "loss": 0.5145, "step": 344 }, { "epoch": 0.04, "learning_rate": 1.9995393663024054e-05, "loss": 0.5248, "step": 345 }, { "epoch": 0.04, "learning_rate": 1.999528063717437e-05, "loss": 0.515, "step": 346 }, { "epoch": 0.04, "learning_rate": 1.9995166241748084e-05, "loss": 0.5016, "step": 347 }, { "epoch": 0.04, "learning_rate": 1.9995050476760864e-05, "loss": 0.5052, "step": 348 }, { "epoch": 0.04, "learning_rate": 1.9994933342228583e-05, "loss": 0.5221, "step": 349 }, { "epoch": 0.04, "learning_rate": 1.9994814838167286e-05, "loss": 0.5006, "step": 350 }, { "epoch": 0.04, "learning_rate": 1.9994694964593206e-05, "loss": 0.513, "step": 351 }, { "epoch": 0.04, "learning_rate": 1.9994573721522776e-05, "loss": 0.5107, "step": 352 }, { "epoch": 0.04, "learning_rate": 1.9994451108972604e-05, "loss": 0.5247, "step": 353 }, { "epoch": 0.04, "learning_rate": 1.999432712695949e-05, "loss": 0.5054, "step": 354 }, { "epoch": 0.04, "learning_rate": 1.999420177550043e-05, "loss": 0.5129, "step": 355 }, { "epoch": 0.04, "learning_rate": 1.999407505461259e-05, "loss": 0.4971, "step": 356 }, { "epoch": 0.04, "learning_rate": 1.999394696431334e-05, "loss": 0.4876, "step": 357 }, { "epoch": 0.04, "learning_rate": 1.999381750462023e-05, "loss": 0.528, "step": 358 }, { "epoch": 0.04, "learning_rate": 1.9993686675550998e-05, "loss": 0.5143, "step": 359 }, { "epoch": 0.04, "learning_rate": 1.9993554477123568e-05, "loss": 0.5101, "step": 360 }, { "epoch": 0.04, "learning_rate": 1.9993420909356058e-05, "loss": 0.5107, "step": 361 }, { "epoch": 0.04, "learning_rate": 1.999328597226677e-05, "loss": 0.5321, "step": 362 }, { "epoch": 0.04, "learning_rate": 1.9993149665874193e-05, "loss": 0.5402, "step": 363 }, { "epoch": 0.04, "learning_rate": 1.9993011990197e-05, "loss": 0.5014, "step": 364 }, { "epoch": 0.04, "learning_rate": 1.9992872945254064e-05, "loss": 0.4866, "step": 365 }, { "epoch": 0.04, "learning_rate": 1.9992732531064427e-05, "loss": 0.5061, "step": 366 }, { "epoch": 0.04, "learning_rate": 1.9992590747647334e-05, "loss": 0.5053, "step": 367 }, { "epoch": 0.04, "learning_rate": 1.9992447595022214e-05, "loss": 0.5216, "step": 368 }, { "epoch": 0.04, "learning_rate": 1.9992303073208678e-05, "loss": 0.5027, "step": 369 }, { "epoch": 0.04, "learning_rate": 1.9992157182226535e-05, "loss": 0.4829, "step": 370 }, { "epoch": 0.04, "learning_rate": 1.9992009922095766e-05, "loss": 0.5256, "step": 371 }, { "epoch": 0.04, "learning_rate": 1.999186129283656e-05, "loss": 0.5018, "step": 372 }, { "epoch": 0.04, "learning_rate": 1.9991711294469273e-05, "loss": 0.509, "step": 373 }, { "epoch": 0.04, "learning_rate": 1.9991559927014465e-05, "loss": 0.5046, "step": 374 }, { "epoch": 0.04, "learning_rate": 1.999140719049287e-05, "loss": 0.5319, "step": 375 }, { "epoch": 0.04, "learning_rate": 1.9991253084925425e-05, "loss": 0.52, "step": 376 }, { "epoch": 0.04, "learning_rate": 1.999109761033324e-05, "loss": 0.5033, "step": 377 }, { "epoch": 0.04, "learning_rate": 1.9990940766737617e-05, "loss": 0.4969, "step": 378 }, { "epoch": 0.04, "learning_rate": 1.999078255416005e-05, "loss": 0.5246, "step": 379 }, { "epoch": 0.04, "learning_rate": 1.9990622972622216e-05, "loss": 0.4919, "step": 380 }, { "epoch": 0.04, "learning_rate": 1.9990462022145985e-05, "loss": 0.5271, "step": 381 }, { "epoch": 0.04, "learning_rate": 1.9990299702753405e-05, "loss": 0.5046, "step": 382 }, { "epoch": 0.04, "learning_rate": 1.9990136014466722e-05, "loss": 0.5027, "step": 383 }, { "epoch": 0.04, "learning_rate": 1.9989970957308364e-05, "loss": 0.5148, "step": 384 }, { "epoch": 0.04, "learning_rate": 1.998980453130095e-05, "loss": 0.529, "step": 385 }, { "epoch": 0.04, "learning_rate": 1.9989636736467278e-05, "loss": 0.5077, "step": 386 }, { "epoch": 0.04, "learning_rate": 1.9989467572830342e-05, "loss": 0.5123, "step": 387 }, { "epoch": 0.04, "learning_rate": 1.9989297040413325e-05, "loss": 0.5002, "step": 388 }, { "epoch": 0.04, "learning_rate": 1.998912513923959e-05, "loss": 0.5295, "step": 389 }, { "epoch": 0.04, "learning_rate": 1.998895186933269e-05, "loss": 0.4975, "step": 390 }, { "epoch": 0.04, "learning_rate": 1.9988777230716367e-05, "loss": 0.5053, "step": 391 }, { "epoch": 0.04, "learning_rate": 1.9988601223414555e-05, "loss": 0.5067, "step": 392 }, { "epoch": 0.04, "learning_rate": 1.998842384745137e-05, "loss": 0.5156, "step": 393 }, { "epoch": 0.05, "learning_rate": 1.998824510285111e-05, "loss": 0.5218, "step": 394 }, { "epoch": 0.05, "learning_rate": 1.998806498963828e-05, "loss": 0.5057, "step": 395 }, { "epoch": 0.05, "learning_rate": 1.9987883507837545e-05, "loss": 0.5167, "step": 396 }, { "epoch": 0.05, "learning_rate": 1.998770065747378e-05, "loss": 0.5119, "step": 397 }, { "epoch": 0.05, "learning_rate": 1.9987516438572035e-05, "loss": 0.5095, "step": 398 }, { "epoch": 0.05, "learning_rate": 1.9987330851157557e-05, "loss": 0.526, "step": 399 }, { "epoch": 0.05, "learning_rate": 1.9987143895255774e-05, "loss": 0.5022, "step": 400 }, { "epoch": 0.05, "learning_rate": 1.9986955570892302e-05, "loss": 0.5204, "step": 401 }, { "epoch": 0.05, "learning_rate": 1.9986765878092945e-05, "loss": 0.5211, "step": 402 }, { "epoch": 0.05, "learning_rate": 1.99865748168837e-05, "loss": 0.5107, "step": 403 }, { "epoch": 0.05, "learning_rate": 1.9986382387290738e-05, "loss": 0.5242, "step": 404 }, { "epoch": 0.05, "learning_rate": 1.9986188589340435e-05, "loss": 0.5001, "step": 405 }, { "epoch": 0.05, "learning_rate": 1.9985993423059342e-05, "loss": 0.4907, "step": 406 }, { "epoch": 0.05, "learning_rate": 1.99857968884742e-05, "loss": 0.5123, "step": 407 }, { "epoch": 0.05, "learning_rate": 1.998559898561194e-05, "loss": 0.508, "step": 408 }, { "epoch": 0.05, "learning_rate": 1.9985399714499678e-05, "loss": 0.4923, "step": 409 }, { "epoch": 0.05, "learning_rate": 1.998519907516472e-05, "loss": 0.5473, "step": 410 }, { "epoch": 0.05, "learning_rate": 1.998499706763456e-05, "loss": 0.5052, "step": 411 }, { "epoch": 0.05, "learning_rate": 1.998479369193687e-05, "loss": 0.5304, "step": 412 }, { "epoch": 0.05, "learning_rate": 1.9984588948099528e-05, "loss": 0.4969, "step": 413 }, { "epoch": 0.05, "learning_rate": 1.998438283615058e-05, "loss": 0.5129, "step": 414 }, { "epoch": 0.05, "learning_rate": 1.9984175356118268e-05, "loss": 0.4953, "step": 415 }, { "epoch": 0.05, "learning_rate": 1.9983966508031026e-05, "loss": 0.5145, "step": 416 }, { "epoch": 0.05, "learning_rate": 1.9983756291917467e-05, "loss": 0.5019, "step": 417 }, { "epoch": 0.05, "learning_rate": 1.99835447078064e-05, "loss": 0.5282, "step": 418 }, { "epoch": 0.05, "learning_rate": 1.998333175572681e-05, "loss": 0.4842, "step": 419 }, { "epoch": 0.05, "learning_rate": 1.998311743570788e-05, "loss": 0.5177, "step": 420 }, { "epoch": 0.05, "learning_rate": 1.998290174777898e-05, "loss": 0.5039, "step": 421 }, { "epoch": 0.05, "learning_rate": 1.998268469196966e-05, "loss": 0.5227, "step": 422 }, { "epoch": 0.05, "learning_rate": 1.998246626830966e-05, "loss": 0.4926, "step": 423 }, { "epoch": 0.05, "learning_rate": 1.998224647682891e-05, "loss": 0.5044, "step": 424 }, { "epoch": 0.05, "learning_rate": 1.998202531755753e-05, "loss": 0.5244, "step": 425 }, { "epoch": 0.05, "learning_rate": 1.9981802790525822e-05, "loss": 0.4932, "step": 426 }, { "epoch": 0.05, "learning_rate": 1.9981578895764272e-05, "loss": 0.5055, "step": 427 }, { "epoch": 0.05, "learning_rate": 1.998135363330357e-05, "loss": 0.537, "step": 428 }, { "epoch": 0.05, "learning_rate": 1.998112700317457e-05, "loss": 0.4919, "step": 429 }, { "epoch": 0.05, "learning_rate": 1.998089900540833e-05, "loss": 0.5127, "step": 430 }, { "epoch": 0.05, "learning_rate": 1.998066964003609e-05, "loss": 0.5092, "step": 431 }, { "epoch": 0.05, "learning_rate": 1.998043890708928e-05, "loss": 0.5153, "step": 432 }, { "epoch": 0.05, "learning_rate": 1.9980206806599516e-05, "loss": 0.508, "step": 433 }, { "epoch": 0.05, "learning_rate": 1.9979973338598603e-05, "loss": 0.5059, "step": 434 }, { "epoch": 0.05, "learning_rate": 1.997973850311852e-05, "loss": 0.4842, "step": 435 }, { "epoch": 0.05, "learning_rate": 1.997950230019146e-05, "loss": 0.5241, "step": 436 }, { "epoch": 0.05, "learning_rate": 1.9979264729849776e-05, "loss": 0.5035, "step": 437 }, { "epoch": 0.05, "learning_rate": 1.9979025792126027e-05, "loss": 0.4893, "step": 438 }, { "epoch": 0.05, "learning_rate": 1.9978785487052952e-05, "loss": 0.5123, "step": 439 }, { "epoch": 0.05, "learning_rate": 1.9978543814663478e-05, "loss": 0.5177, "step": 440 }, { "epoch": 0.05, "learning_rate": 1.9978300774990716e-05, "loss": 0.4992, "step": 441 }, { "epoch": 0.05, "learning_rate": 1.9978056368067973e-05, "loss": 0.5116, "step": 442 }, { "epoch": 0.05, "learning_rate": 1.9977810593928736e-05, "loss": 0.5017, "step": 443 }, { "epoch": 0.05, "learning_rate": 1.9977563452606677e-05, "loss": 0.5114, "step": 444 }, { "epoch": 0.05, "learning_rate": 1.9977314944135667e-05, "loss": 0.4902, "step": 445 }, { "epoch": 0.05, "learning_rate": 1.9977065068549756e-05, "loss": 0.5134, "step": 446 }, { "epoch": 0.05, "learning_rate": 1.9976813825883182e-05, "loss": 0.4954, "step": 447 }, { "epoch": 0.05, "learning_rate": 1.9976561216170368e-05, "loss": 0.5045, "step": 448 }, { "epoch": 0.05, "learning_rate": 1.9976307239445924e-05, "loss": 0.4949, "step": 449 }, { "epoch": 0.05, "learning_rate": 1.9976051895744663e-05, "loss": 0.5228, "step": 450 }, { "epoch": 0.05, "learning_rate": 1.997579518510156e-05, "loss": 0.5035, "step": 451 }, { "epoch": 0.05, "learning_rate": 1.99755371075518e-05, "loss": 0.5046, "step": 452 }, { "epoch": 0.05, "learning_rate": 1.9975277663130736e-05, "loss": 0.5041, "step": 453 }, { "epoch": 0.05, "learning_rate": 1.9975016851873925e-05, "loss": 0.5142, "step": 454 }, { "epoch": 0.05, "learning_rate": 1.99747546738171e-05, "loss": 0.4906, "step": 455 }, { "epoch": 0.05, "learning_rate": 1.997449112899619e-05, "loss": 0.5018, "step": 456 }, { "epoch": 0.05, "learning_rate": 1.99742262174473e-05, "loss": 0.5064, "step": 457 }, { "epoch": 0.05, "learning_rate": 1.9973959939206734e-05, "loss": 0.4996, "step": 458 }, { "epoch": 0.05, "learning_rate": 1.9973692294310972e-05, "loss": 0.5149, "step": 459 }, { "epoch": 0.05, "learning_rate": 1.9973423282796695e-05, "loss": 0.4956, "step": 460 }, { "epoch": 0.05, "learning_rate": 1.9973152904700762e-05, "loss": 0.5125, "step": 461 }, { "epoch": 0.05, "learning_rate": 1.9972881160060216e-05, "loss": 0.5385, "step": 462 }, { "epoch": 0.05, "learning_rate": 1.997260804891229e-05, "loss": 0.485, "step": 463 }, { "epoch": 0.05, "learning_rate": 1.9972333571294418e-05, "loss": 0.5028, "step": 464 }, { "epoch": 0.05, "learning_rate": 1.9972057727244203e-05, "loss": 0.4887, "step": 465 }, { "epoch": 0.05, "learning_rate": 1.997178051679944e-05, "loss": 0.5229, "step": 466 }, { "epoch": 0.05, "learning_rate": 1.997150193999811e-05, "loss": 0.4953, "step": 467 }, { "epoch": 0.05, "learning_rate": 1.9971221996878395e-05, "loss": 0.5123, "step": 468 }, { "epoch": 0.05, "learning_rate": 1.9970940687478643e-05, "loss": 0.5256, "step": 469 }, { "epoch": 0.05, "learning_rate": 1.9970658011837404e-05, "loss": 0.501, "step": 470 }, { "epoch": 0.05, "learning_rate": 1.9970373969993414e-05, "loss": 0.5173, "step": 471 }, { "epoch": 0.05, "learning_rate": 1.997008856198559e-05, "loss": 0.5047, "step": 472 }, { "epoch": 0.05, "learning_rate": 1.9969801787853035e-05, "loss": 0.5107, "step": 473 }, { "epoch": 0.05, "learning_rate": 1.996951364763505e-05, "loss": 0.5104, "step": 474 }, { "epoch": 0.05, "learning_rate": 1.9969224141371114e-05, "loss": 0.5097, "step": 475 }, { "epoch": 0.05, "learning_rate": 1.99689332691009e-05, "loss": 0.5093, "step": 476 }, { "epoch": 0.05, "learning_rate": 1.9968641030864254e-05, "loss": 0.4957, "step": 477 }, { "epoch": 0.05, "learning_rate": 1.9968347426701228e-05, "loss": 0.5105, "step": 478 }, { "epoch": 0.05, "learning_rate": 1.9968052456652048e-05, "loss": 0.504, "step": 479 }, { "epoch": 0.05, "learning_rate": 1.9967756120757132e-05, "loss": 0.5008, "step": 480 }, { "epoch": 0.05, "learning_rate": 1.9967458419057092e-05, "loss": 0.5101, "step": 481 }, { "epoch": 0.06, "learning_rate": 1.9967159351592706e-05, "loss": 0.5092, "step": 482 }, { "epoch": 0.06, "learning_rate": 1.9966858918404965e-05, "loss": 0.5023, "step": 483 }, { "epoch": 0.06, "learning_rate": 1.996655711953503e-05, "loss": 0.5103, "step": 484 }, { "epoch": 0.06, "learning_rate": 1.996625395502425e-05, "loss": 0.5325, "step": 485 }, { "epoch": 0.06, "learning_rate": 1.9965949424914175e-05, "loss": 0.5126, "step": 486 }, { "epoch": 0.06, "learning_rate": 1.9965643529246526e-05, "loss": 0.5017, "step": 487 }, { "epoch": 0.06, "learning_rate": 1.996533626806322e-05, "loss": 0.5367, "step": 488 }, { "epoch": 0.06, "learning_rate": 1.9965027641406355e-05, "loss": 0.4925, "step": 489 }, { "epoch": 0.06, "learning_rate": 1.996471764931822e-05, "loss": 0.5153, "step": 490 }, { "epoch": 0.06, "learning_rate": 1.99644062918413e-05, "loss": 0.5196, "step": 491 }, { "epoch": 0.06, "learning_rate": 1.9964093569018247e-05, "loss": 0.4936, "step": 492 }, { "epoch": 0.06, "learning_rate": 1.9963779480891917e-05, "loss": 0.5085, "step": 493 }, { "epoch": 0.06, "learning_rate": 1.9963464027505343e-05, "loss": 0.5153, "step": 494 }, { "epoch": 0.06, "learning_rate": 1.996314720890175e-05, "loss": 0.5228, "step": 495 }, { "epoch": 0.06, "learning_rate": 1.9962829025124553e-05, "loss": 0.499, "step": 496 }, { "epoch": 0.06, "learning_rate": 1.9962509476217348e-05, "loss": 0.512, "step": 497 }, { "epoch": 0.06, "learning_rate": 1.9962188562223916e-05, "loss": 0.4839, "step": 498 }, { "epoch": 0.06, "learning_rate": 1.9961866283188237e-05, "loss": 0.4876, "step": 499 }, { "epoch": 0.06, "learning_rate": 1.9961542639154467e-05, "loss": 0.5057, "step": 500 }, { "epoch": 0.06, "learning_rate": 1.9961217630166954e-05, "loss": 0.5144, "step": 501 }, { "epoch": 0.06, "learning_rate": 1.9960891256270224e-05, "loss": 0.5042, "step": 502 }, { "epoch": 0.06, "learning_rate": 1.9960563517509008e-05, "loss": 0.5188, "step": 503 }, { "epoch": 0.06, "learning_rate": 1.996023441392821e-05, "loss": 0.4886, "step": 504 }, { "epoch": 0.06, "learning_rate": 1.9959903945572918e-05, "loss": 0.4883, "step": 505 }, { "epoch": 0.06, "learning_rate": 1.9959572112488423e-05, "loss": 0.5606, "step": 506 }, { "epoch": 0.06, "learning_rate": 1.9959238914720188e-05, "loss": 0.492, "step": 507 }, { "epoch": 0.06, "learning_rate": 1.995890435231387e-05, "loss": 0.4934, "step": 508 }, { "epoch": 0.06, "learning_rate": 1.9958568425315316e-05, "loss": 0.5088, "step": 509 }, { "epoch": 0.06, "learning_rate": 1.9958231133770548e-05, "loss": 0.5085, "step": 510 }, { "epoch": 0.06, "learning_rate": 1.995789247772578e-05, "loss": 0.5067, "step": 511 }, { "epoch": 0.06, "learning_rate": 1.9957552457227428e-05, "loss": 0.5029, "step": 512 }, { "epoch": 0.06, "learning_rate": 1.9957211072322075e-05, "loss": 0.4727, "step": 513 }, { "epoch": 0.06, "learning_rate": 1.9956868323056494e-05, "loss": 0.5176, "step": 514 }, { "epoch": 0.06, "learning_rate": 1.9956524209477658e-05, "loss": 0.5033, "step": 515 }, { "epoch": 0.06, "learning_rate": 1.9956178731632715e-05, "loss": 0.513, "step": 516 }, { "epoch": 0.06, "learning_rate": 1.9955831889568998e-05, "loss": 0.5041, "step": 517 }, { "epoch": 0.06, "learning_rate": 1.995548368333404e-05, "loss": 0.4975, "step": 518 }, { "epoch": 0.06, "learning_rate": 1.9955134112975548e-05, "loss": 0.5129, "step": 519 }, { "epoch": 0.06, "learning_rate": 1.9954783178541424e-05, "loss": 0.505, "step": 520 }, { "epoch": 0.06, "learning_rate": 1.995443088007975e-05, "loss": 0.5008, "step": 521 }, { "epoch": 0.06, "learning_rate": 1.9954077217638807e-05, "loss": 0.5171, "step": 522 }, { "epoch": 0.06, "learning_rate": 1.995372219126704e-05, "loss": 0.4896, "step": 523 }, { "epoch": 0.06, "learning_rate": 1.995336580101311e-05, "loss": 0.521, "step": 524 }, { "epoch": 0.06, "learning_rate": 1.9953008046925844e-05, "loss": 0.5038, "step": 525 }, { "epoch": 0.06, "learning_rate": 1.9952648929054262e-05, "loss": 0.5123, "step": 526 }, { "epoch": 0.06, "learning_rate": 1.9952288447447573e-05, "loss": 0.5118, "step": 527 }, { "epoch": 0.06, "learning_rate": 1.995192660215517e-05, "loss": 0.5144, "step": 528 }, { "epoch": 0.06, "learning_rate": 1.9951563393226632e-05, "loss": 0.5075, "step": 529 }, { "epoch": 0.06, "learning_rate": 1.9951198820711735e-05, "loss": 0.497, "step": 530 }, { "epoch": 0.06, "learning_rate": 1.995083288466042e-05, "loss": 0.4836, "step": 531 }, { "epoch": 0.06, "learning_rate": 1.995046558512284e-05, "loss": 0.5177, "step": 532 }, { "epoch": 0.06, "learning_rate": 1.995009692214932e-05, "loss": 0.4862, "step": 533 }, { "epoch": 0.06, "learning_rate": 1.994972689579037e-05, "loss": 0.5107, "step": 534 }, { "epoch": 0.06, "learning_rate": 1.99493555060967e-05, "loss": 0.4924, "step": 535 }, { "epoch": 0.06, "learning_rate": 1.994898275311919e-05, "loss": 0.4966, "step": 536 }, { "epoch": 0.06, "learning_rate": 1.9948608636908928e-05, "loss": 0.5062, "step": 537 }, { "epoch": 0.06, "learning_rate": 1.9948233157517164e-05, "loss": 0.5026, "step": 538 }, { "epoch": 0.06, "learning_rate": 1.994785631499535e-05, "loss": 0.5129, "step": 539 }, { "epoch": 0.06, "learning_rate": 1.9947478109395123e-05, "loss": 0.5277, "step": 540 }, { "epoch": 0.06, "learning_rate": 1.9947098540768306e-05, "loss": 0.5, "step": 541 }, { "epoch": 0.06, "learning_rate": 1.994671760916691e-05, "loss": 0.5134, "step": 542 }, { "epoch": 0.06, "learning_rate": 1.994633531464313e-05, "loss": 0.5056, "step": 543 }, { "epoch": 0.06, "learning_rate": 1.9945951657249348e-05, "loss": 0.5002, "step": 544 }, { "epoch": 0.06, "learning_rate": 1.9945566637038133e-05, "loss": 0.509, "step": 545 }, { "epoch": 0.06, "learning_rate": 1.9945180254062242e-05, "loss": 0.5243, "step": 546 }, { "epoch": 0.06, "learning_rate": 1.994479250837462e-05, "loss": 0.5495, "step": 547 }, { "epoch": 0.06, "learning_rate": 1.9944403400028392e-05, "loss": 0.4995, "step": 548 }, { "epoch": 0.06, "learning_rate": 1.9944012929076884e-05, "loss": 0.4847, "step": 549 }, { "epoch": 0.06, "learning_rate": 1.9943621095573588e-05, "loss": 0.5106, "step": 550 }, { "epoch": 0.06, "learning_rate": 1.9943227899572198e-05, "loss": 0.5006, "step": 551 }, { "epoch": 0.06, "learning_rate": 1.9942833341126597e-05, "loss": 0.5108, "step": 552 }, { "epoch": 0.06, "learning_rate": 1.9942437420290835e-05, "loss": 0.4873, "step": 553 }, { "epoch": 0.06, "learning_rate": 1.994204013711918e-05, "loss": 0.5005, "step": 554 }, { "epoch": 0.06, "learning_rate": 1.9941641491666052e-05, "loss": 0.5119, "step": 555 }, { "epoch": 0.06, "learning_rate": 1.994124148398608e-05, "loss": 0.5057, "step": 556 }, { "epoch": 0.06, "learning_rate": 1.9940840114134078e-05, "loss": 0.4932, "step": 557 }, { "epoch": 0.06, "learning_rate": 1.9940437382165038e-05, "loss": 0.505, "step": 558 }, { "epoch": 0.06, "learning_rate": 1.9940033288134143e-05, "loss": 0.487, "step": 559 }, { "epoch": 0.06, "learning_rate": 1.993962783209677e-05, "loss": 0.5201, "step": 560 }, { "epoch": 0.06, "learning_rate": 1.9939221014108467e-05, "loss": 0.5063, "step": 561 }, { "epoch": 0.06, "learning_rate": 1.9938812834224978e-05, "loss": 0.5005, "step": 562 }, { "epoch": 0.06, "learning_rate": 1.993840329250224e-05, "loss": 0.5017, "step": 563 }, { "epoch": 0.06, "learning_rate": 1.993799238899636e-05, "loss": 0.519, "step": 564 }, { "epoch": 0.06, "learning_rate": 1.9937580123763645e-05, "loss": 0.4934, "step": 565 }, { "epoch": 0.06, "learning_rate": 1.993716649686059e-05, "loss": 0.5086, "step": 566 }, { "epoch": 0.06, "learning_rate": 1.993675150834386e-05, "loss": 0.4863, "step": 567 }, { "epoch": 0.06, "learning_rate": 1.993633515827033e-05, "loss": 0.5089, "step": 568 }, { "epoch": 0.07, "learning_rate": 1.9935917446697038e-05, "loss": 0.5077, "step": 569 }, { "epoch": 0.07, "learning_rate": 1.993549837368123e-05, "loss": 0.4964, "step": 570 }, { "epoch": 0.07, "learning_rate": 1.9935077939280316e-05, "loss": 0.5055, "step": 571 }, { "epoch": 0.07, "learning_rate": 1.993465614355192e-05, "loss": 0.503, "step": 572 }, { "epoch": 0.07, "learning_rate": 1.9934232986553823e-05, "loss": 0.5179, "step": 573 }, { "epoch": 0.07, "learning_rate": 1.9933808468344016e-05, "loss": 0.4953, "step": 574 }, { "epoch": 0.07, "learning_rate": 1.9933382588980665e-05, "loss": 0.4912, "step": 575 }, { "epoch": 0.07, "learning_rate": 1.9932955348522125e-05, "loss": 0.4973, "step": 576 }, { "epoch": 0.07, "learning_rate": 1.9932526747026936e-05, "loss": 0.5004, "step": 577 }, { "epoch": 0.07, "learning_rate": 1.993209678455383e-05, "loss": 0.5175, "step": 578 }, { "epoch": 0.07, "learning_rate": 1.9931665461161716e-05, "loss": 0.5021, "step": 579 }, { "epoch": 0.07, "learning_rate": 1.9931232776909703e-05, "loss": 0.5096, "step": 580 }, { "epoch": 0.07, "learning_rate": 1.993079873185707e-05, "loss": 0.4768, "step": 581 }, { "epoch": 0.07, "learning_rate": 1.993036332606329e-05, "loss": 0.5109, "step": 582 }, { "epoch": 0.07, "learning_rate": 1.9929926559588032e-05, "loss": 0.4972, "step": 583 }, { "epoch": 0.07, "learning_rate": 1.9929488432491137e-05, "loss": 0.4919, "step": 584 }, { "epoch": 0.07, "learning_rate": 1.9929048944832638e-05, "loss": 0.4959, "step": 585 }, { "epoch": 0.07, "learning_rate": 1.9928608096672757e-05, "loss": 0.5132, "step": 586 }, { "epoch": 0.07, "learning_rate": 1.99281658880719e-05, "loss": 0.512, "step": 587 }, { "epoch": 0.07, "learning_rate": 1.992772231909066e-05, "loss": 0.4972, "step": 588 }, { "epoch": 0.07, "learning_rate": 1.9927277389789812e-05, "loss": 0.5027, "step": 589 }, { "epoch": 0.07, "learning_rate": 1.9926831100230322e-05, "loss": 0.4921, "step": 590 }, { "epoch": 0.07, "learning_rate": 1.9926383450473344e-05, "loss": 0.5223, "step": 591 }, { "epoch": 0.07, "learning_rate": 1.9925934440580218e-05, "loss": 0.496, "step": 592 }, { "epoch": 0.07, "learning_rate": 1.9925484070612465e-05, "loss": 0.5087, "step": 593 }, { "epoch": 0.07, "learning_rate": 1.9925032340631793e-05, "loss": 0.5022, "step": 594 }, { "epoch": 0.07, "learning_rate": 1.9924579250700104e-05, "loss": 0.511, "step": 595 }, { "epoch": 0.07, "learning_rate": 1.992412480087948e-05, "loss": 0.509, "step": 596 }, { "epoch": 0.07, "learning_rate": 1.992366899123219e-05, "loss": 0.513, "step": 597 }, { "epoch": 0.07, "learning_rate": 1.9923211821820692e-05, "loss": 0.5128, "step": 598 }, { "epoch": 0.07, "learning_rate": 1.9922753292707627e-05, "loss": 0.5197, "step": 599 }, { "epoch": 0.07, "learning_rate": 1.992229340395582e-05, "loss": 0.4962, "step": 600 }, { "epoch": 0.07, "learning_rate": 1.9921832155628295e-05, "loss": 0.4956, "step": 601 }, { "epoch": 0.07, "learning_rate": 1.9921369547788246e-05, "loss": 0.4905, "step": 602 }, { "epoch": 0.07, "learning_rate": 1.9920905580499063e-05, "loss": 0.5012, "step": 603 }, { "epoch": 0.07, "learning_rate": 1.9920440253824318e-05, "loss": 0.4991, "step": 604 }, { "epoch": 0.07, "learning_rate": 1.9919973567827776e-05, "loss": 0.5092, "step": 605 }, { "epoch": 0.07, "learning_rate": 1.991950552257338e-05, "loss": 0.4813, "step": 606 }, { "epoch": 0.07, "learning_rate": 1.991903611812526e-05, "loss": 0.4992, "step": 607 }, { "epoch": 0.07, "learning_rate": 1.9918565354547738e-05, "loss": 0.4908, "step": 608 }, { "epoch": 0.07, "learning_rate": 1.991809323190532e-05, "loss": 0.505, "step": 609 }, { "epoch": 0.07, "learning_rate": 1.99176197502627e-05, "loss": 0.4865, "step": 610 }, { "epoch": 0.07, "learning_rate": 1.9917144909684745e-05, "loss": 0.4982, "step": 611 }, { "epoch": 0.07, "learning_rate": 1.9916668710236528e-05, "loss": 0.5175, "step": 612 }, { "epoch": 0.07, "learning_rate": 1.9916191151983297e-05, "loss": 0.529, "step": 613 }, { "epoch": 0.07, "learning_rate": 1.9915712234990486e-05, "loss": 0.4916, "step": 614 }, { "epoch": 0.07, "learning_rate": 1.9915231959323722e-05, "loss": 0.5154, "step": 615 }, { "epoch": 0.07, "learning_rate": 1.991475032504881e-05, "loss": 0.4903, "step": 616 }, { "epoch": 0.07, "learning_rate": 1.9914267332231746e-05, "loss": 0.4984, "step": 617 }, { "epoch": 0.07, "learning_rate": 1.991378298093871e-05, "loss": 0.5179, "step": 618 }, { "epoch": 0.07, "learning_rate": 1.9913297271236063e-05, "loss": 0.4865, "step": 619 }, { "epoch": 0.07, "learning_rate": 1.9912810203190367e-05, "loss": 0.5074, "step": 620 }, { "epoch": 0.07, "learning_rate": 1.991232177686836e-05, "loss": 0.5076, "step": 621 }, { "epoch": 0.07, "learning_rate": 1.9911831992336963e-05, "loss": 0.5042, "step": 622 }, { "epoch": 0.07, "learning_rate": 1.9911340849663293e-05, "loss": 0.5021, "step": 623 }, { "epoch": 0.07, "learning_rate": 1.991084834891464e-05, "loss": 0.5062, "step": 624 }, { "epoch": 0.07, "learning_rate": 1.9910354490158498e-05, "loss": 0.4975, "step": 625 }, { "epoch": 0.07, "learning_rate": 1.9909859273462525e-05, "loss": 0.4892, "step": 626 }, { "epoch": 0.07, "learning_rate": 1.9909362698894585e-05, "loss": 0.4962, "step": 627 }, { "epoch": 0.07, "learning_rate": 1.9908864766522716e-05, "loss": 0.5167, "step": 628 }, { "epoch": 0.07, "learning_rate": 1.9908365476415146e-05, "loss": 0.5168, "step": 629 }, { "epoch": 0.07, "learning_rate": 1.9907864828640292e-05, "loss": 0.502, "step": 630 }, { "epoch": 0.07, "learning_rate": 1.9907362823266752e-05, "loss": 0.5143, "step": 631 }, { "epoch": 0.07, "learning_rate": 1.9906859460363307e-05, "loss": 0.5045, "step": 632 }, { "epoch": 0.07, "learning_rate": 1.9906354739998937e-05, "loss": 0.5051, "step": 633 }, { "epoch": 0.07, "learning_rate": 1.99058486622428e-05, "loss": 0.4971, "step": 634 }, { "epoch": 0.07, "learning_rate": 1.990534122716423e-05, "loss": 0.4839, "step": 635 }, { "epoch": 0.07, "learning_rate": 1.990483243483277e-05, "loss": 0.5059, "step": 636 }, { "epoch": 0.07, "learning_rate": 1.990432228531813e-05, "loss": 0.504, "step": 637 }, { "epoch": 0.07, "learning_rate": 1.9903810778690204e-05, "loss": 0.5081, "step": 638 }, { "epoch": 0.07, "learning_rate": 1.9903297915019093e-05, "loss": 0.5, "step": 639 }, { "epoch": 0.07, "learning_rate": 1.9902783694375064e-05, "loss": 0.5103, "step": 640 }, { "epoch": 0.07, "learning_rate": 1.9902268116828578e-05, "loss": 0.5111, "step": 641 }, { "epoch": 0.07, "learning_rate": 1.9901751182450276e-05, "loss": 0.4893, "step": 642 }, { "epoch": 0.07, "learning_rate": 1.9901232891310998e-05, "loss": 0.4861, "step": 643 }, { "epoch": 0.07, "learning_rate": 1.9900713243481758e-05, "loss": 0.5005, "step": 644 }, { "epoch": 0.07, "learning_rate": 1.990019223903376e-05, "loss": 0.4887, "step": 645 }, { "epoch": 0.07, "learning_rate": 1.9899669878038382e-05, "loss": 0.5158, "step": 646 }, { "epoch": 0.07, "learning_rate": 1.989914616056722e-05, "loss": 0.4871, "step": 647 }, { "epoch": 0.07, "learning_rate": 1.9898621086692017e-05, "loss": 0.5133, "step": 648 }, { "epoch": 0.07, "learning_rate": 1.989809465648473e-05, "loss": 0.4984, "step": 649 }, { "epoch": 0.07, "learning_rate": 1.989756687001749e-05, "loss": 0.4881, "step": 650 }, { "epoch": 0.07, "learning_rate": 1.9897037727362612e-05, "loss": 0.4802, "step": 651 }, { "epoch": 0.07, "learning_rate": 1.9896507228592604e-05, "loss": 0.5036, "step": 652 }, { "epoch": 0.07, "learning_rate": 1.989597537378015e-05, "loss": 0.4942, "step": 653 }, { "epoch": 0.07, "learning_rate": 1.9895442162998136e-05, "loss": 0.5228, "step": 654 }, { "epoch": 0.07, "learning_rate": 1.9894907596319615e-05, "loss": 0.4976, "step": 655 }, { "epoch": 0.07, "learning_rate": 1.989437167381784e-05, "loss": 0.5151, "step": 656 }, { "epoch": 0.08, "learning_rate": 1.9893834395566242e-05, "loss": 0.5039, "step": 657 }, { "epoch": 0.08, "learning_rate": 1.989329576163844e-05, "loss": 0.4843, "step": 658 }, { "epoch": 0.08, "learning_rate": 1.989275577210824e-05, "loss": 0.5066, "step": 659 }, { "epoch": 0.08, "learning_rate": 1.989221442704963e-05, "loss": 0.497, "step": 660 }, { "epoch": 0.08, "learning_rate": 1.9891671726536787e-05, "loss": 0.4965, "step": 661 }, { "epoch": 0.08, "learning_rate": 1.9891127670644076e-05, "loss": 0.4853, "step": 662 }, { "epoch": 0.08, "learning_rate": 1.9890582259446046e-05, "loss": 0.5132, "step": 663 }, { "epoch": 0.08, "learning_rate": 1.9890035493017424e-05, "loss": 0.4881, "step": 664 }, { "epoch": 0.08, "learning_rate": 1.9889487371433134e-05, "loss": 0.5049, "step": 665 }, { "epoch": 0.08, "learning_rate": 1.988893789476828e-05, "loss": 0.4886, "step": 666 }, { "epoch": 0.08, "learning_rate": 1.9888387063098153e-05, "loss": 0.5109, "step": 667 }, { "epoch": 0.08, "learning_rate": 1.9887834876498228e-05, "loss": 0.4744, "step": 668 }, { "epoch": 0.08, "learning_rate": 1.9887281335044167e-05, "loss": 0.4952, "step": 669 }, { "epoch": 0.08, "learning_rate": 1.988672643881182e-05, "loss": 0.4774, "step": 670 }, { "epoch": 0.08, "learning_rate": 1.9886170187877214e-05, "loss": 0.509, "step": 671 }, { "epoch": 0.08, "learning_rate": 1.9885612582316575e-05, "loss": 0.4924, "step": 672 }, { "epoch": 0.08, "learning_rate": 1.9885053622206305e-05, "loss": 0.4924, "step": 673 }, { "epoch": 0.08, "learning_rate": 1.9884493307622993e-05, "loss": 0.5126, "step": 674 }, { "epoch": 0.08, "learning_rate": 1.988393163864341e-05, "loss": 0.4876, "step": 675 }, { "epoch": 0.08, "learning_rate": 1.9883368615344526e-05, "loss": 0.4895, "step": 676 }, { "epoch": 0.08, "learning_rate": 1.9882804237803487e-05, "loss": 0.5074, "step": 677 }, { "epoch": 0.08, "learning_rate": 1.988223850609762e-05, "loss": 0.4826, "step": 678 }, { "epoch": 0.08, "learning_rate": 1.9881671420304444e-05, "loss": 0.5268, "step": 679 }, { "epoch": 0.08, "learning_rate": 1.9881102980501664e-05, "loss": 0.4995, "step": 680 }, { "epoch": 0.08, "learning_rate": 1.988053318676717e-05, "loss": 0.5015, "step": 681 }, { "epoch": 0.08, "learning_rate": 1.9879962039179033e-05, "loss": 0.5134, "step": 682 }, { "epoch": 0.08, "learning_rate": 1.9879389537815514e-05, "loss": 0.4966, "step": 683 }, { "epoch": 0.08, "learning_rate": 1.9878815682755062e-05, "loss": 0.4792, "step": 684 }, { "epoch": 0.08, "learning_rate": 1.9878240474076306e-05, "loss": 0.523, "step": 685 }, { "epoch": 0.08, "learning_rate": 1.987766391185806e-05, "loss": 0.492, "step": 686 }, { "epoch": 0.08, "learning_rate": 1.9877085996179327e-05, "loss": 0.5097, "step": 687 }, { "epoch": 0.08, "learning_rate": 1.9876506727119294e-05, "loss": 0.4948, "step": 688 }, { "epoch": 0.08, "learning_rate": 1.9875926104757337e-05, "loss": 0.5193, "step": 689 }, { "epoch": 0.08, "learning_rate": 1.9875344129173012e-05, "loss": 0.5, "step": 690 }, { "epoch": 0.08, "learning_rate": 1.9874760800446063e-05, "loss": 0.4983, "step": 691 }, { "epoch": 0.08, "learning_rate": 1.9874176118656415e-05, "loss": 0.4759, "step": 692 }, { "epoch": 0.08, "learning_rate": 1.9873590083884192e-05, "loss": 0.5069, "step": 693 }, { "epoch": 0.08, "learning_rate": 1.9873002696209688e-05, "loss": 0.5129, "step": 694 }, { "epoch": 0.08, "learning_rate": 1.9872413955713382e-05, "loss": 0.508, "step": 695 }, { "epoch": 0.08, "learning_rate": 1.9871823862475955e-05, "loss": 0.4963, "step": 696 }, { "epoch": 0.08, "learning_rate": 1.987123241657826e-05, "loss": 0.5074, "step": 697 }, { "epoch": 0.08, "learning_rate": 1.9870639618101333e-05, "loss": 0.5238, "step": 698 }, { "epoch": 0.08, "learning_rate": 1.987004546712641e-05, "loss": 0.4916, "step": 699 }, { "epoch": 0.08, "learning_rate": 1.9869449963734894e-05, "loss": 0.4913, "step": 700 }, { "epoch": 0.08, "learning_rate": 1.9868853108008387e-05, "loss": 0.4755, "step": 701 }, { "epoch": 0.08, "learning_rate": 1.986825490002867e-05, "loss": 0.4836, "step": 702 }, { "epoch": 0.08, "learning_rate": 1.9867655339877713e-05, "loss": 0.4985, "step": 703 }, { "epoch": 0.08, "learning_rate": 1.9867054427637667e-05, "loss": 0.4972, "step": 704 }, { "epoch": 0.08, "learning_rate": 1.986645216339087e-05, "loss": 0.5101, "step": 705 }, { "epoch": 0.08, "learning_rate": 1.9865848547219845e-05, "loss": 0.4929, "step": 706 }, { "epoch": 0.08, "learning_rate": 1.9865243579207304e-05, "loss": 0.4964, "step": 707 }, { "epoch": 0.08, "learning_rate": 1.986463725943614e-05, "loss": 0.5103, "step": 708 }, { "epoch": 0.08, "learning_rate": 1.9864029587989432e-05, "loss": 0.481, "step": 709 }, { "epoch": 0.08, "learning_rate": 1.9863420564950445e-05, "loss": 0.4843, "step": 710 }, { "epoch": 0.08, "learning_rate": 1.986281019040263e-05, "loss": 0.5253, "step": 711 }, { "epoch": 0.08, "learning_rate": 1.9862198464429614e-05, "loss": 0.4945, "step": 712 }, { "epoch": 0.08, "learning_rate": 1.9861585387115228e-05, "loss": 0.4945, "step": 713 }, { "epoch": 0.08, "learning_rate": 1.986097095854347e-05, "loss": 0.4998, "step": 714 }, { "epoch": 0.08, "learning_rate": 1.9860355178798536e-05, "loss": 0.4981, "step": 715 }, { "epoch": 0.08, "learning_rate": 1.9859738047964795e-05, "loss": 0.5039, "step": 716 }, { "epoch": 0.08, "learning_rate": 1.9859119566126813e-05, "loss": 0.4968, "step": 717 }, { "epoch": 0.08, "learning_rate": 1.9858499733369335e-05, "loss": 0.4974, "step": 718 }, { "epoch": 0.08, "learning_rate": 1.985787854977729e-05, "loss": 0.4996, "step": 719 }, { "epoch": 0.08, "learning_rate": 1.9857256015435797e-05, "loss": 0.4793, "step": 720 }, { "epoch": 0.08, "learning_rate": 1.985663213043015e-05, "loss": 0.4923, "step": 721 }, { "epoch": 0.08, "learning_rate": 1.9856006894845844e-05, "loss": 0.4878, "step": 722 }, { "epoch": 0.08, "learning_rate": 1.9855380308768546e-05, "loss": 0.5218, "step": 723 }, { "epoch": 0.08, "learning_rate": 1.9854752372284113e-05, "loss": 0.4872, "step": 724 }, { "epoch": 0.08, "learning_rate": 1.9854123085478587e-05, "loss": 0.4902, "step": 725 }, { "epoch": 0.08, "learning_rate": 1.9853492448438192e-05, "loss": 0.5086, "step": 726 }, { "epoch": 0.08, "learning_rate": 1.985286046124934e-05, "loss": 0.4679, "step": 727 }, { "epoch": 0.08, "learning_rate": 1.985222712399863e-05, "loss": 0.4948, "step": 728 }, { "epoch": 0.08, "learning_rate": 1.985159243677284e-05, "loss": 0.4955, "step": 729 }, { "epoch": 0.08, "learning_rate": 1.985095639965894e-05, "loss": 0.4996, "step": 730 }, { "epoch": 0.08, "learning_rate": 1.985031901274408e-05, "loss": 0.512, "step": 731 }, { "epoch": 0.08, "learning_rate": 1.9849680276115593e-05, "loss": 0.492, "step": 732 }, { "epoch": 0.08, "learning_rate": 1.9849040189861004e-05, "loss": 0.4928, "step": 733 }, { "epoch": 0.08, "learning_rate": 1.9848398754068018e-05, "loss": 0.5268, "step": 734 }, { "epoch": 0.08, "learning_rate": 1.984775596882452e-05, "loss": 0.4822, "step": 735 }, { "epoch": 0.08, "learning_rate": 1.98471118342186e-05, "loss": 0.487, "step": 736 }, { "epoch": 0.08, "learning_rate": 1.9846466350338506e-05, "loss": 0.5087, "step": 737 }, { "epoch": 0.08, "learning_rate": 1.9845819517272688e-05, "loss": 0.4785, "step": 738 }, { "epoch": 0.08, "learning_rate": 1.9845171335109776e-05, "loss": 0.523, "step": 739 }, { "epoch": 0.08, "learning_rate": 1.9844521803938588e-05, "loss": 0.4755, "step": 740 }, { "epoch": 0.08, "learning_rate": 1.9843870923848122e-05, "loss": 0.4949, "step": 741 }, { "epoch": 0.08, "learning_rate": 1.984321869492756e-05, "loss": 0.5024, "step": 742 }, { "epoch": 0.08, "learning_rate": 1.984256511726628e-05, "loss": 0.502, "step": 743 }, { "epoch": 0.09, "learning_rate": 1.984191019095383e-05, "loss": 0.4899, "step": 744 }, { "epoch": 0.09, "learning_rate": 1.9841253916079953e-05, "loss": 0.5067, "step": 745 }, { "epoch": 0.09, "learning_rate": 1.9840596292734573e-05, "loss": 0.4877, "step": 746 }, { "epoch": 0.09, "learning_rate": 1.9839937321007795e-05, "loss": 0.5142, "step": 747 }, { "epoch": 0.09, "learning_rate": 1.983927700098992e-05, "loss": 0.488, "step": 748 }, { "epoch": 0.09, "learning_rate": 1.983861533277142e-05, "loss": 0.501, "step": 749 }, { "epoch": 0.09, "learning_rate": 1.983795231644296e-05, "loss": 0.4959, "step": 750 }, { "epoch": 0.09, "learning_rate": 1.983728795209539e-05, "loss": 0.5074, "step": 751 }, { "epoch": 0.09, "learning_rate": 1.9836622239819743e-05, "loss": 0.4955, "step": 752 }, { "epoch": 0.09, "learning_rate": 1.983595517970723e-05, "loss": 0.4876, "step": 753 }, { "epoch": 0.09, "learning_rate": 1.9835286771849264e-05, "loss": 0.4906, "step": 754 }, { "epoch": 0.09, "learning_rate": 1.9834617016337424e-05, "loss": 0.5096, "step": 755 }, { "epoch": 0.09, "learning_rate": 1.9833945913263483e-05, "loss": 0.513, "step": 756 }, { "epoch": 0.09, "learning_rate": 1.9833273462719396e-05, "loss": 0.5042, "step": 757 }, { "epoch": 0.09, "learning_rate": 1.9832599664797306e-05, "loss": 0.4622, "step": 758 }, { "epoch": 0.09, "learning_rate": 1.9831924519589537e-05, "loss": 0.4877, "step": 759 }, { "epoch": 0.09, "learning_rate": 1.9831248027188604e-05, "loss": 0.5123, "step": 760 }, { "epoch": 0.09, "learning_rate": 1.983057018768719e-05, "loss": 0.4812, "step": 761 }, { "epoch": 0.09, "learning_rate": 1.982989100117819e-05, "loss": 0.4839, "step": 762 }, { "epoch": 0.09, "learning_rate": 1.9829210467754654e-05, "loss": 0.5185, "step": 763 }, { "epoch": 0.09, "learning_rate": 1.9828528587509836e-05, "loss": 0.4878, "step": 764 }, { "epoch": 0.09, "learning_rate": 1.982784536053717e-05, "loss": 0.4959, "step": 765 }, { "epoch": 0.09, "learning_rate": 1.9827160786930267e-05, "loss": 0.5101, "step": 766 }, { "epoch": 0.09, "learning_rate": 1.9826474866782933e-05, "loss": 0.4955, "step": 767 }, { "epoch": 0.09, "learning_rate": 1.9825787600189163e-05, "loss": 0.5152, "step": 768 }, { "epoch": 0.09, "learning_rate": 1.982509898724311e-05, "loss": 0.4909, "step": 769 }, { "epoch": 0.09, "learning_rate": 1.9824409028039143e-05, "loss": 0.5013, "step": 770 }, { "epoch": 0.09, "learning_rate": 1.9823717722671798e-05, "loss": 0.4928, "step": 771 }, { "epoch": 0.09, "learning_rate": 1.98230250712358e-05, "loss": 0.4885, "step": 772 }, { "epoch": 0.09, "learning_rate": 1.9822331073826056e-05, "loss": 0.5048, "step": 773 }, { "epoch": 0.09, "learning_rate": 1.982163573053766e-05, "loss": 0.4921, "step": 774 }, { "epoch": 0.09, "learning_rate": 1.9820939041465887e-05, "loss": 0.4884, "step": 775 }, { "epoch": 0.09, "learning_rate": 1.9820241006706203e-05, "loss": 0.4746, "step": 776 }, { "epoch": 0.09, "learning_rate": 1.9819541626354252e-05, "loss": 0.4968, "step": 777 }, { "epoch": 0.09, "learning_rate": 1.9818840900505866e-05, "loss": 0.4767, "step": 778 }, { "epoch": 0.09, "learning_rate": 1.9818138829257063e-05, "loss": 0.5091, "step": 779 }, { "epoch": 0.09, "learning_rate": 1.9817435412704037e-05, "loss": 0.5013, "step": 780 }, { "epoch": 0.09, "learning_rate": 1.981673065094317e-05, "loss": 0.525, "step": 781 }, { "epoch": 0.09, "learning_rate": 1.9816024544071038e-05, "loss": 0.4728, "step": 782 }, { "epoch": 0.09, "learning_rate": 1.9815317092184388e-05, "loss": 0.505, "step": 783 }, { "epoch": 0.09, "learning_rate": 1.9814608295380155e-05, "loss": 0.4836, "step": 784 }, { "epoch": 0.09, "learning_rate": 1.9813898153755465e-05, "loss": 0.4904, "step": 785 }, { "epoch": 0.09, "learning_rate": 1.9813186667407624e-05, "loss": 0.4916, "step": 786 }, { "epoch": 0.09, "learning_rate": 1.9812473836434115e-05, "loss": 0.4835, "step": 787 }, { "epoch": 0.09, "learning_rate": 1.981175966093262e-05, "loss": 0.5016, "step": 788 }, { "epoch": 0.09, "learning_rate": 1.9811044141000985e-05, "loss": 0.507, "step": 789 }, { "epoch": 0.09, "learning_rate": 1.9810327276737268e-05, "loss": 0.4745, "step": 790 }, { "epoch": 0.09, "learning_rate": 1.980960906823968e-05, "loss": 0.5002, "step": 791 }, { "epoch": 0.09, "learning_rate": 1.9808889515606644e-05, "loss": 0.4881, "step": 792 }, { "epoch": 0.09, "learning_rate": 1.9808168618936746e-05, "loss": 0.4806, "step": 793 }, { "epoch": 0.09, "learning_rate": 1.980744637832877e-05, "loss": 0.4801, "step": 794 }, { "epoch": 0.09, "learning_rate": 1.9806722793881675e-05, "loss": 0.4944, "step": 795 }, { "epoch": 0.09, "learning_rate": 1.9805997865694616e-05, "loss": 0.499, "step": 796 }, { "epoch": 0.09, "learning_rate": 1.9805271593866914e-05, "loss": 0.5009, "step": 797 }, { "epoch": 0.09, "learning_rate": 1.9804543978498093e-05, "loss": 0.4867, "step": 798 }, { "epoch": 0.09, "learning_rate": 1.9803815019687844e-05, "loss": 0.5012, "step": 799 }, { "epoch": 0.09, "learning_rate": 1.980308471753606e-05, "loss": 0.5014, "step": 800 }, { "epoch": 0.09, "learning_rate": 1.9802353072142802e-05, "loss": 0.5037, "step": 801 }, { "epoch": 0.09, "learning_rate": 1.9801620083608327e-05, "loss": 0.4848, "step": 802 }, { "epoch": 0.09, "learning_rate": 1.9800885752033067e-05, "loss": 0.4847, "step": 803 }, { "epoch": 0.09, "learning_rate": 1.980015007751764e-05, "loss": 0.4958, "step": 804 }, { "epoch": 0.09, "learning_rate": 1.9799413060162854e-05, "loss": 0.4871, "step": 805 }, { "epoch": 0.09, "learning_rate": 1.9798674700069698e-05, "loss": 0.4962, "step": 806 }, { "epoch": 0.09, "learning_rate": 1.979793499733934e-05, "loss": 0.5009, "step": 807 }, { "epoch": 0.09, "learning_rate": 1.9797193952073135e-05, "loss": 0.4764, "step": 808 }, { "epoch": 0.09, "learning_rate": 1.9796451564372624e-05, "loss": 0.5013, "step": 809 }, { "epoch": 0.09, "learning_rate": 1.979570783433954e-05, "loss": 0.5022, "step": 810 }, { "epoch": 0.09, "learning_rate": 1.9794962762075772e-05, "loss": 0.4912, "step": 811 }, { "epoch": 0.09, "learning_rate": 1.9794216347683425e-05, "loss": 0.5052, "step": 812 }, { "epoch": 0.09, "learning_rate": 1.979346859126477e-05, "loss": 0.4961, "step": 813 }, { "epoch": 0.09, "learning_rate": 1.979271949292227e-05, "loss": 0.5019, "step": 814 }, { "epoch": 0.09, "learning_rate": 1.9791969052758563e-05, "loss": 0.497, "step": 815 }, { "epoch": 0.09, "learning_rate": 1.979121727087648e-05, "loss": 0.4944, "step": 816 }, { "epoch": 0.09, "learning_rate": 1.979046414737903e-05, "loss": 0.4989, "step": 817 }, { "epoch": 0.09, "learning_rate": 1.978970968236941e-05, "loss": 0.4955, "step": 818 }, { "epoch": 0.09, "learning_rate": 1.9788953875950992e-05, "loss": 0.4843, "step": 819 }, { "epoch": 0.09, "learning_rate": 1.9788196728227348e-05, "loss": 0.4918, "step": 820 }, { "epoch": 0.09, "learning_rate": 1.9787438239302217e-05, "loss": 0.4815, "step": 821 }, { "epoch": 0.09, "learning_rate": 1.9786678409279535e-05, "loss": 0.4935, "step": 822 }, { "epoch": 0.09, "learning_rate": 1.9785917238263405e-05, "loss": 0.4966, "step": 823 }, { "epoch": 0.09, "learning_rate": 1.9785154726358134e-05, "loss": 0.514, "step": 824 }, { "epoch": 0.09, "learning_rate": 1.9784390873668206e-05, "loss": 0.517, "step": 825 }, { "epoch": 0.09, "learning_rate": 1.9783625680298276e-05, "loss": 0.4887, "step": 826 }, { "epoch": 0.09, "learning_rate": 1.9782859146353196e-05, "loss": 0.4793, "step": 827 }, { "epoch": 0.09, "learning_rate": 1.9782091271938e-05, "loss": 0.4941, "step": 828 }, { "epoch": 0.09, "learning_rate": 1.9781322057157902e-05, "loss": 0.5018, "step": 829 }, { "epoch": 0.09, "learning_rate": 1.9780551502118306e-05, "loss": 0.4994, "step": 830 }, { "epoch": 0.09, "learning_rate": 1.9779779606924788e-05, "loss": 0.491, "step": 831 }, { "epoch": 0.1, "learning_rate": 1.977900637168312e-05, "loss": 0.4961, "step": 832 }, { "epoch": 0.1, "learning_rate": 1.9778231796499254e-05, "loss": 0.4925, "step": 833 }, { "epoch": 0.1, "learning_rate": 1.977745588147932e-05, "loss": 0.4914, "step": 834 }, { "epoch": 0.1, "learning_rate": 1.977667862672964e-05, "loss": 0.4989, "step": 835 }, { "epoch": 0.1, "learning_rate": 1.9775900032356704e-05, "loss": 0.4993, "step": 836 }, { "epoch": 0.1, "learning_rate": 1.9775120098467212e-05, "loss": 0.4878, "step": 837 }, { "epoch": 0.1, "learning_rate": 1.9774338825168024e-05, "loss": 0.5092, "step": 838 }, { "epoch": 0.1, "learning_rate": 1.977355621256619e-05, "loss": 0.4944, "step": 839 }, { "epoch": 0.1, "learning_rate": 1.9772772260768954e-05, "loss": 0.5022, "step": 840 }, { "epoch": 0.1, "learning_rate": 1.9771986969883727e-05, "loss": 0.5086, "step": 841 }, { "epoch": 0.1, "learning_rate": 1.9771200340018115e-05, "loss": 0.4895, "step": 842 }, { "epoch": 0.1, "learning_rate": 1.97704123712799e-05, "loss": 0.4911, "step": 843 }, { "epoch": 0.1, "learning_rate": 1.976962306377706e-05, "loss": 0.5018, "step": 844 }, { "epoch": 0.1, "learning_rate": 1.9768832417617737e-05, "loss": 0.4837, "step": 845 }, { "epoch": 0.1, "learning_rate": 1.9768040432910276e-05, "loss": 0.5251, "step": 846 }, { "epoch": 0.1, "learning_rate": 1.976724710976319e-05, "loss": 0.5045, "step": 847 }, { "epoch": 0.1, "learning_rate": 1.9766452448285184e-05, "loss": 0.5115, "step": 848 }, { "epoch": 0.1, "learning_rate": 1.9765656448585148e-05, "loss": 0.4769, "step": 849 }, { "epoch": 0.1, "learning_rate": 1.976485911077215e-05, "loss": 0.4936, "step": 850 }, { "epoch": 0.1, "learning_rate": 1.9764060434955437e-05, "loss": 0.4867, "step": 851 }, { "epoch": 0.1, "learning_rate": 1.9763260421244455e-05, "loss": 0.4924, "step": 852 }, { "epoch": 0.1, "learning_rate": 1.9762459069748817e-05, "loss": 0.4903, "step": 853 }, { "epoch": 0.1, "learning_rate": 1.9761656380578328e-05, "loss": 0.4812, "step": 854 }, { "epoch": 0.1, "learning_rate": 1.9760852353842973e-05, "loss": 0.4974, "step": 855 }, { "epoch": 0.1, "learning_rate": 1.9760046989652926e-05, "loss": 0.5047, "step": 856 }, { "epoch": 0.1, "learning_rate": 1.9759240288118536e-05, "loss": 0.4837, "step": 857 }, { "epoch": 0.1, "learning_rate": 1.975843224935034e-05, "loss": 0.4966, "step": 858 }, { "epoch": 0.1, "learning_rate": 1.9757622873459056e-05, "loss": 0.505, "step": 859 }, { "epoch": 0.1, "learning_rate": 1.9756812160555586e-05, "loss": 0.4818, "step": 860 }, { "epoch": 0.1, "learning_rate": 1.9756000110751023e-05, "loss": 0.4965, "step": 861 }, { "epoch": 0.1, "learning_rate": 1.975518672415663e-05, "loss": 0.4987, "step": 862 }, { "epoch": 0.1, "learning_rate": 1.975437200088386e-05, "loss": 0.4718, "step": 863 }, { "epoch": 0.1, "learning_rate": 1.9753555941044345e-05, "loss": 0.5024, "step": 864 }, { "epoch": 0.1, "learning_rate": 1.9752738544749906e-05, "loss": 0.4937, "step": 865 }, { "epoch": 0.1, "learning_rate": 1.975191981211255e-05, "loss": 0.4968, "step": 866 }, { "epoch": 0.1, "learning_rate": 1.9751099743244454e-05, "loss": 0.4785, "step": 867 }, { "epoch": 0.1, "learning_rate": 1.9750278338257985e-05, "loss": 0.5002, "step": 868 }, { "epoch": 0.1, "learning_rate": 1.9749455597265704e-05, "loss": 0.4948, "step": 869 }, { "epoch": 0.1, "learning_rate": 1.9748631520380333e-05, "loss": 0.4887, "step": 870 }, { "epoch": 0.1, "learning_rate": 1.97478061077148e-05, "loss": 0.4751, "step": 871 }, { "epoch": 0.1, "learning_rate": 1.9746979359382193e-05, "loss": 0.4976, "step": 872 }, { "epoch": 0.1, "learning_rate": 1.9746151275495803e-05, "loss": 0.5071, "step": 873 }, { "epoch": 0.1, "learning_rate": 1.974532185616909e-05, "loss": 0.5251, "step": 874 }, { "epoch": 0.1, "learning_rate": 1.9744491101515715e-05, "loss": 0.484, "step": 875 }, { "epoch": 0.1, "learning_rate": 1.9743659011649495e-05, "loss": 0.4894, "step": 876 }, { "epoch": 0.1, "learning_rate": 1.9742825586684457e-05, "loss": 0.4815, "step": 877 }, { "epoch": 0.1, "learning_rate": 1.9741990826734793e-05, "loss": 0.5014, "step": 878 }, { "epoch": 0.1, "learning_rate": 1.9741154731914882e-05, "loss": 0.4918, "step": 879 }, { "epoch": 0.1, "learning_rate": 1.974031730233929e-05, "loss": 0.4868, "step": 880 }, { "epoch": 0.1, "learning_rate": 1.9739478538122765e-05, "loss": 0.4782, "step": 881 }, { "epoch": 0.1, "learning_rate": 1.9738638439380237e-05, "loss": 0.5087, "step": 882 }, { "epoch": 0.1, "learning_rate": 1.9737797006226815e-05, "loss": 0.4789, "step": 883 }, { "epoch": 0.1, "learning_rate": 1.9736954238777793e-05, "loss": 0.4782, "step": 884 }, { "epoch": 0.1, "learning_rate": 1.973611013714865e-05, "loss": 0.4946, "step": 885 }, { "epoch": 0.1, "learning_rate": 1.9735264701455054e-05, "loss": 0.5054, "step": 886 }, { "epoch": 0.1, "learning_rate": 1.973441793181284e-05, "loss": 0.4952, "step": 887 }, { "epoch": 0.1, "learning_rate": 1.9733569828338038e-05, "loss": 0.4816, "step": 888 }, { "epoch": 0.1, "learning_rate": 1.9732720391146852e-05, "loss": 0.5189, "step": 889 }, { "epoch": 0.1, "learning_rate": 1.973186962035568e-05, "loss": 0.4958, "step": 890 }, { "epoch": 0.1, "learning_rate": 1.97310175160811e-05, "loss": 0.5128, "step": 891 }, { "epoch": 0.1, "learning_rate": 1.9730164078439857e-05, "loss": 0.5123, "step": 892 }, { "epoch": 0.1, "learning_rate": 1.97293093075489e-05, "loss": 0.4817, "step": 893 }, { "epoch": 0.1, "learning_rate": 1.9728453203525352e-05, "loss": 0.5027, "step": 894 }, { "epoch": 0.1, "learning_rate": 1.9727595766486514e-05, "loss": 0.5033, "step": 895 }, { "epoch": 0.1, "learning_rate": 1.972673699654988e-05, "loss": 0.4904, "step": 896 }, { "epoch": 0.1, "learning_rate": 1.9725876893833108e-05, "loss": 0.4848, "step": 897 }, { "epoch": 0.1, "learning_rate": 1.9725015458454068e-05, "loss": 0.4898, "step": 898 }, { "epoch": 0.1, "learning_rate": 1.9724152690530785e-05, "loss": 0.5056, "step": 899 }, { "epoch": 0.1, "learning_rate": 1.972328859018148e-05, "loss": 0.4908, "step": 900 }, { "epoch": 0.1, "learning_rate": 1.9722423157524553e-05, "loss": 0.4829, "step": 901 }, { "epoch": 0.1, "learning_rate": 1.972155639267859e-05, "loss": 0.4885, "step": 902 }, { "epoch": 0.1, "learning_rate": 1.972068829576236e-05, "loss": 0.4938, "step": 903 }, { "epoch": 0.1, "learning_rate": 1.9719818866894802e-05, "loss": 0.4802, "step": 904 }, { "epoch": 0.1, "learning_rate": 1.9718948106195055e-05, "loss": 0.5079, "step": 905 }, { "epoch": 0.1, "learning_rate": 1.971807601378243e-05, "loss": 0.4982, "step": 906 }, { "epoch": 0.1, "learning_rate": 1.9717202589776424e-05, "loss": 0.4993, "step": 907 }, { "epoch": 0.1, "learning_rate": 1.971632783429672e-05, "loss": 0.5026, "step": 908 }, { "epoch": 0.1, "learning_rate": 1.9715451747463168e-05, "loss": 0.4881, "step": 909 }, { "epoch": 0.1, "learning_rate": 1.971457432939582e-05, "loss": 0.5166, "step": 910 }, { "epoch": 0.1, "learning_rate": 1.97136955802149e-05, "loss": 0.4888, "step": 911 }, { "epoch": 0.1, "learning_rate": 1.9712815500040815e-05, "loss": 0.4803, "step": 912 }, { "epoch": 0.1, "learning_rate": 1.9711934088994157e-05, "loss": 0.4939, "step": 913 }, { "epoch": 0.1, "learning_rate": 1.97110513471957e-05, "loss": 0.4948, "step": 914 }, { "epoch": 0.1, "learning_rate": 1.9710167274766395e-05, "loss": 0.4926, "step": 915 }, { "epoch": 0.1, "learning_rate": 1.9709281871827386e-05, "loss": 0.4969, "step": 916 }, { "epoch": 0.1, "learning_rate": 1.9708395138499986e-05, "loss": 0.4836, "step": 917 }, { "epoch": 0.1, "learning_rate": 1.97075070749057e-05, "loss": 0.5263, "step": 918 }, { "epoch": 0.11, "learning_rate": 1.970661768116622e-05, "loss": 0.4922, "step": 919 }, { "epoch": 0.11, "learning_rate": 1.9705726957403398e-05, "loss": 0.4912, "step": 920 }, { "epoch": 0.11, "learning_rate": 1.9704834903739297e-05, "loss": 0.4587, "step": 921 }, { "epoch": 0.11, "learning_rate": 1.970394152029614e-05, "loss": 0.5059, "step": 922 }, { "epoch": 0.11, "learning_rate": 1.970304680719634e-05, "loss": 0.4826, "step": 923 }, { "epoch": 0.11, "learning_rate": 1.9702150764562498e-05, "loss": 0.5044, "step": 924 }, { "epoch": 0.11, "learning_rate": 1.970125339251739e-05, "loss": 0.4838, "step": 925 }, { "epoch": 0.11, "learning_rate": 1.9700354691183977e-05, "loss": 0.5082, "step": 926 }, { "epoch": 0.11, "learning_rate": 1.9699454660685398e-05, "loss": 0.4833, "step": 927 }, { "epoch": 0.11, "learning_rate": 1.969855330114498e-05, "loss": 0.4837, "step": 928 }, { "epoch": 0.11, "learning_rate": 1.9697650612686228e-05, "loss": 0.4915, "step": 929 }, { "epoch": 0.11, "learning_rate": 1.9696746595432828e-05, "loss": 0.4941, "step": 930 }, { "epoch": 0.11, "learning_rate": 1.9695841249508656e-05, "loss": 0.5001, "step": 931 }, { "epoch": 0.11, "learning_rate": 1.9694934575037762e-05, "loss": 0.514, "step": 932 }, { "epoch": 0.11, "learning_rate": 1.969402657214438e-05, "loss": 0.4917, "step": 933 }, { "epoch": 0.11, "learning_rate": 1.9693117240952928e-05, "loss": 0.4981, "step": 934 }, { "epoch": 0.11, "learning_rate": 1.9692206581588e-05, "loss": 0.4806, "step": 935 }, { "epoch": 0.11, "learning_rate": 1.969129459417438e-05, "loss": 0.496, "step": 936 }, { "epoch": 0.11, "learning_rate": 1.9690381278837038e-05, "loss": 0.4817, "step": 937 }, { "epoch": 0.11, "learning_rate": 1.9689466635701106e-05, "loss": 0.5036, "step": 938 }, { "epoch": 0.11, "learning_rate": 1.9688550664891915e-05, "loss": 0.5118, "step": 939 }, { "epoch": 0.11, "learning_rate": 1.968763336653498e-05, "loss": 0.5007, "step": 940 }, { "epoch": 0.11, "learning_rate": 1.968671474075598e-05, "loss": 0.4755, "step": 941 }, { "epoch": 0.11, "learning_rate": 1.96857947876808e-05, "loss": 0.51, "step": 942 }, { "epoch": 0.11, "learning_rate": 1.968487350743548e-05, "loss": 0.4993, "step": 943 }, { "epoch": 0.11, "learning_rate": 1.968395090014627e-05, "loss": 0.5162, "step": 944 }, { "epoch": 0.11, "learning_rate": 1.968302696593958e-05, "loss": 0.4912, "step": 945 }, { "epoch": 0.11, "learning_rate": 1.968210170494201e-05, "loss": 0.4905, "step": 946 }, { "epoch": 0.11, "learning_rate": 1.9681175117280343e-05, "loss": 0.4988, "step": 947 }, { "epoch": 0.11, "learning_rate": 1.9680247203081537e-05, "loss": 0.4947, "step": 948 }, { "epoch": 0.11, "learning_rate": 1.9679317962472746e-05, "loss": 0.4997, "step": 949 }, { "epoch": 0.11, "learning_rate": 1.9678387395581292e-05, "loss": 0.4728, "step": 950 }, { "epoch": 0.11, "learning_rate": 1.967745550253468e-05, "loss": 0.4971, "step": 951 }, { "epoch": 0.11, "learning_rate": 1.9676522283460606e-05, "loss": 0.488, "step": 952 }, { "epoch": 0.11, "learning_rate": 1.9675587738486935e-05, "loss": 0.4897, "step": 953 }, { "epoch": 0.11, "learning_rate": 1.9674651867741733e-05, "loss": 0.4924, "step": 954 }, { "epoch": 0.11, "learning_rate": 1.967371467135322e-05, "loss": 0.489, "step": 955 }, { "epoch": 0.11, "learning_rate": 1.9672776149449826e-05, "loss": 0.4761, "step": 956 }, { "epoch": 0.11, "learning_rate": 1.967183630216014e-05, "loss": 0.513, "step": 957 }, { "epoch": 0.11, "learning_rate": 1.9670895129612946e-05, "loss": 0.4968, "step": 958 }, { "epoch": 0.11, "learning_rate": 1.9669952631937206e-05, "loss": 0.4754, "step": 959 }, { "epoch": 0.11, "learning_rate": 1.9669008809262064e-05, "loss": 0.4952, "step": 960 }, { "epoch": 0.11, "learning_rate": 1.9668063661716837e-05, "loss": 0.4881, "step": 961 }, { "epoch": 0.11, "learning_rate": 1.9667117189431045e-05, "loss": 0.4988, "step": 962 }, { "epoch": 0.11, "learning_rate": 1.9666169392534363e-05, "loss": 0.4809, "step": 963 }, { "epoch": 0.11, "learning_rate": 1.966522027115667e-05, "loss": 0.4772, "step": 964 }, { "epoch": 0.11, "learning_rate": 1.966426982542801e-05, "loss": 0.4936, "step": 965 }, { "epoch": 0.11, "learning_rate": 1.9663318055478616e-05, "loss": 0.4872, "step": 966 }, { "epoch": 0.11, "learning_rate": 1.9662364961438907e-05, "loss": 0.5017, "step": 967 }, { "epoch": 0.11, "learning_rate": 1.966141054343947e-05, "loss": 0.4938, "step": 968 }, { "epoch": 0.11, "learning_rate": 1.9660454801611094e-05, "loss": 0.4742, "step": 969 }, { "epoch": 0.11, "learning_rate": 1.9659497736084722e-05, "loss": 0.4818, "step": 970 }, { "epoch": 0.11, "learning_rate": 1.9658539346991504e-05, "loss": 0.4862, "step": 971 }, { "epoch": 0.11, "learning_rate": 1.9657579634462757e-05, "loss": 0.4894, "step": 972 }, { "epoch": 0.11, "learning_rate": 1.9656618598629985e-05, "loss": 0.4805, "step": 973 }, { "epoch": 0.11, "learning_rate": 1.9655656239624864e-05, "loss": 0.4846, "step": 974 }, { "epoch": 0.11, "learning_rate": 1.965469255757927e-05, "loss": 0.5027, "step": 975 }, { "epoch": 0.11, "learning_rate": 1.9653727552625242e-05, "loss": 0.4863, "step": 976 }, { "epoch": 0.11, "learning_rate": 1.9652761224895006e-05, "loss": 0.4852, "step": 977 }, { "epoch": 0.11, "learning_rate": 1.9651793574520975e-05, "loss": 0.4887, "step": 978 }, { "epoch": 0.11, "learning_rate": 1.965082460163574e-05, "loss": 0.4766, "step": 979 }, { "epoch": 0.11, "learning_rate": 1.9649854306372065e-05, "loss": 0.5133, "step": 980 }, { "epoch": 0.11, "learning_rate": 1.9648882688862905e-05, "loss": 0.4669, "step": 981 }, { "epoch": 0.11, "learning_rate": 1.9647909749241394e-05, "loss": 0.4821, "step": 982 }, { "epoch": 0.11, "learning_rate": 1.9646935487640848e-05, "loss": 0.4946, "step": 983 }, { "epoch": 0.11, "learning_rate": 1.964595990419476e-05, "loss": 0.5043, "step": 984 }, { "epoch": 0.11, "learning_rate": 1.964498299903681e-05, "loss": 0.4751, "step": 985 }, { "epoch": 0.11, "learning_rate": 1.964400477230085e-05, "loss": 0.5033, "step": 986 }, { "epoch": 0.11, "learning_rate": 1.9643025224120923e-05, "loss": 0.4757, "step": 987 }, { "epoch": 0.11, "learning_rate": 1.9642044354631255e-05, "loss": 0.4983, "step": 988 }, { "epoch": 0.11, "learning_rate": 1.9641062163966232e-05, "loss": 0.49, "step": 989 }, { "epoch": 0.11, "learning_rate": 1.9640078652260447e-05, "loss": 0.4855, "step": 990 }, { "epoch": 0.11, "learning_rate": 1.9639093819648664e-05, "loss": 0.5073, "step": 991 }, { "epoch": 0.11, "learning_rate": 1.963810766626582e-05, "loss": 0.5177, "step": 992 }, { "epoch": 0.11, "learning_rate": 1.9637120192247046e-05, "loss": 0.4823, "step": 993 }, { "epoch": 0.11, "learning_rate": 1.9636131397727646e-05, "loss": 0.4998, "step": 994 }, { "epoch": 0.11, "learning_rate": 1.9635141282843105e-05, "loss": 0.4702, "step": 995 }, { "epoch": 0.11, "learning_rate": 1.9634149847729093e-05, "loss": 0.4997, "step": 996 }, { "epoch": 0.11, "learning_rate": 1.963315709252146e-05, "loss": 0.4942, "step": 997 }, { "epoch": 0.11, "learning_rate": 1.963216301735623e-05, "loss": 0.5002, "step": 998 }, { "epoch": 0.11, "learning_rate": 1.9631167622369617e-05, "loss": 0.5039, "step": 999 }, { "epoch": 0.11, "learning_rate": 1.9630170907698015e-05, "loss": 0.497, "step": 1000 }, { "epoch": 0.11, "learning_rate": 1.9629172873477995e-05, "loss": 0.4884, "step": 1001 }, { "epoch": 0.11, "learning_rate": 1.9628173519846308e-05, "loss": 0.4728, "step": 1002 }, { "epoch": 0.11, "learning_rate": 1.9627172846939886e-05, "loss": 0.5004, "step": 1003 }, { "epoch": 0.11, "learning_rate": 1.962617085489585e-05, "loss": 0.4989, "step": 1004 }, { "epoch": 0.11, "learning_rate": 1.962516754385149e-05, "loss": 0.4877, "step": 1005 }, { "epoch": 0.11, "learning_rate": 1.962416291394428e-05, "loss": 0.4992, "step": 1006 }, { "epoch": 0.12, "learning_rate": 1.9623156965311884e-05, "loss": 0.4895, "step": 1007 }, { "epoch": 0.12, "learning_rate": 1.9622149698092135e-05, "loss": 0.4922, "step": 1008 }, { "epoch": 0.12, "learning_rate": 1.962114111242305e-05, "loss": 0.5085, "step": 1009 }, { "epoch": 0.12, "learning_rate": 1.962013120844283e-05, "loss": 0.473, "step": 1010 }, { "epoch": 0.12, "learning_rate": 1.9619119986289855e-05, "loss": 0.4942, "step": 1011 }, { "epoch": 0.12, "learning_rate": 1.9618107446102682e-05, "loss": 0.4962, "step": 1012 }, { "epoch": 0.12, "learning_rate": 1.9617093588020057e-05, "loss": 0.4859, "step": 1013 }, { "epoch": 0.12, "learning_rate": 1.9616078412180896e-05, "loss": 0.4819, "step": 1014 }, { "epoch": 0.12, "learning_rate": 1.96150619187243e-05, "loss": 0.4826, "step": 1015 }, { "epoch": 0.12, "learning_rate": 1.9614044107789553e-05, "loss": 0.5166, "step": 1016 }, { "epoch": 0.12, "learning_rate": 1.9613024979516123e-05, "loss": 0.4963, "step": 1017 }, { "epoch": 0.12, "learning_rate": 1.9612004534043644e-05, "loss": 0.4796, "step": 1018 }, { "epoch": 0.12, "learning_rate": 1.9610982771511947e-05, "loss": 0.4787, "step": 1019 }, { "epoch": 0.12, "learning_rate": 1.9609959692061037e-05, "loss": 0.4938, "step": 1020 }, { "epoch": 0.12, "learning_rate": 1.9608935295831092e-05, "loss": 0.48, "step": 1021 }, { "epoch": 0.12, "learning_rate": 1.9607909582962478e-05, "loss": 0.4807, "step": 1022 }, { "epoch": 0.12, "learning_rate": 1.9606882553595748e-05, "loss": 0.4893, "step": 1023 }, { "epoch": 0.12, "learning_rate": 1.960585420787162e-05, "loss": 0.4854, "step": 1024 }, { "epoch": 0.12, "learning_rate": 1.9604824545931005e-05, "loss": 0.5115, "step": 1025 }, { "epoch": 0.12, "learning_rate": 1.960379356791499e-05, "loss": 0.4804, "step": 1026 }, { "epoch": 0.12, "learning_rate": 1.960276127396484e-05, "loss": 0.4954, "step": 1027 }, { "epoch": 0.12, "learning_rate": 1.9601727664222e-05, "loss": 0.4761, "step": 1028 }, { "epoch": 0.12, "learning_rate": 1.96006927388281e-05, "loss": 0.5093, "step": 1029 }, { "epoch": 0.12, "learning_rate": 1.959965649792495e-05, "loss": 0.4766, "step": 1030 }, { "epoch": 0.12, "learning_rate": 1.9598618941654535e-05, "loss": 0.4788, "step": 1031 }, { "epoch": 0.12, "learning_rate": 1.9597580070159026e-05, "loss": 0.4934, "step": 1032 }, { "epoch": 0.12, "learning_rate": 1.9596539883580773e-05, "loss": 0.4993, "step": 1033 }, { "epoch": 0.12, "learning_rate": 1.9595498382062295e-05, "loss": 0.4967, "step": 1034 }, { "epoch": 0.12, "learning_rate": 1.9594455565746313e-05, "loss": 0.5108, "step": 1035 }, { "epoch": 0.12, "learning_rate": 1.959341143477571e-05, "loss": 0.482, "step": 1036 }, { "epoch": 0.12, "learning_rate": 1.9592365989293557e-05, "loss": 0.4744, "step": 1037 }, { "epoch": 0.12, "learning_rate": 1.95913192294431e-05, "loss": 0.5033, "step": 1038 }, { "epoch": 0.12, "learning_rate": 1.9590271155367776e-05, "loss": 0.4749, "step": 1039 }, { "epoch": 0.12, "learning_rate": 1.9589221767211188e-05, "loss": 0.489, "step": 1040 }, { "epoch": 0.12, "learning_rate": 1.9588171065117122e-05, "loss": 0.4956, "step": 1041 }, { "epoch": 0.12, "learning_rate": 1.9587119049229558e-05, "loss": 0.4975, "step": 1042 }, { "epoch": 0.12, "learning_rate": 1.9586065719692636e-05, "loss": 0.5006, "step": 1043 }, { "epoch": 0.12, "learning_rate": 1.9585011076650695e-05, "loss": 0.5086, "step": 1044 }, { "epoch": 0.12, "learning_rate": 1.958395512024824e-05, "loss": 0.4902, "step": 1045 }, { "epoch": 0.12, "learning_rate": 1.9582897850629958e-05, "loss": 0.4795, "step": 1046 }, { "epoch": 0.12, "learning_rate": 1.9581839267940722e-05, "loss": 0.4852, "step": 1047 }, { "epoch": 0.12, "learning_rate": 1.9580779372325583e-05, "loss": 0.4886, "step": 1048 }, { "epoch": 0.12, "learning_rate": 1.9579718163929767e-05, "loss": 0.4913, "step": 1049 }, { "epoch": 0.12, "learning_rate": 1.957865564289868e-05, "loss": 0.5032, "step": 1050 }, { "epoch": 0.12, "learning_rate": 1.9577591809377917e-05, "loss": 0.4787, "step": 1051 }, { "epoch": 0.12, "learning_rate": 1.957652666351325e-05, "loss": 0.5013, "step": 1052 }, { "epoch": 0.12, "learning_rate": 1.9575460205450616e-05, "loss": 0.5499, "step": 1053 }, { "epoch": 0.12, "learning_rate": 1.9574392435336156e-05, "loss": 0.4768, "step": 1054 }, { "epoch": 0.12, "learning_rate": 1.957332335331617e-05, "loss": 0.4963, "step": 1055 }, { "epoch": 0.12, "learning_rate": 1.957225295953715e-05, "loss": 0.4937, "step": 1056 }, { "epoch": 0.12, "learning_rate": 1.9571181254145762e-05, "loss": 0.4775, "step": 1057 }, { "epoch": 0.12, "learning_rate": 1.9570108237288853e-05, "loss": 0.5146, "step": 1058 }, { "epoch": 0.12, "learning_rate": 1.9569033909113454e-05, "loss": 0.4953, "step": 1059 }, { "epoch": 0.12, "learning_rate": 1.9567958269766768e-05, "loss": 0.4758, "step": 1060 }, { "epoch": 0.12, "learning_rate": 1.9566881319396184e-05, "loss": 0.5177, "step": 1061 }, { "epoch": 0.12, "learning_rate": 1.956580305814927e-05, "loss": 0.4715, "step": 1062 }, { "epoch": 0.12, "learning_rate": 1.9564723486173766e-05, "loss": 0.4987, "step": 1063 }, { "epoch": 0.12, "learning_rate": 1.95636426036176e-05, "loss": 0.4819, "step": 1064 }, { "epoch": 0.12, "learning_rate": 1.9562560410628883e-05, "loss": 0.5034, "step": 1065 }, { "epoch": 0.12, "learning_rate": 1.9561476907355886e-05, "loss": 0.5026, "step": 1066 }, { "epoch": 0.12, "learning_rate": 1.956039209394709e-05, "loss": 0.5056, "step": 1067 }, { "epoch": 0.12, "learning_rate": 1.9559305970551125e-05, "loss": 0.4825, "step": 1068 }, { "epoch": 0.12, "learning_rate": 1.955821853731682e-05, "loss": 0.515, "step": 1069 }, { "epoch": 0.12, "learning_rate": 1.955712979439318e-05, "loss": 0.4992, "step": 1070 }, { "epoch": 0.12, "learning_rate": 1.955603974192938e-05, "loss": 0.483, "step": 1071 }, { "epoch": 0.12, "learning_rate": 1.955494838007479e-05, "loss": 0.493, "step": 1072 }, { "epoch": 0.12, "learning_rate": 1.9553855708978943e-05, "loss": 0.4969, "step": 1073 }, { "epoch": 0.12, "learning_rate": 1.9552761728791563e-05, "loss": 0.506, "step": 1074 }, { "epoch": 0.12, "learning_rate": 1.955166643966255e-05, "loss": 0.4959, "step": 1075 }, { "epoch": 0.12, "learning_rate": 1.9550569841741984e-05, "loss": 0.4879, "step": 1076 }, { "epoch": 0.12, "learning_rate": 1.9549471935180123e-05, "loss": 0.4908, "step": 1077 }, { "epoch": 0.12, "learning_rate": 1.95483727201274e-05, "loss": 0.4847, "step": 1078 }, { "epoch": 0.12, "learning_rate": 1.9547272196734436e-05, "loss": 0.5054, "step": 1079 }, { "epoch": 0.12, "learning_rate": 1.954617036515203e-05, "loss": 0.4997, "step": 1080 }, { "epoch": 0.12, "learning_rate": 1.9545067225531155e-05, "loss": 0.5026, "step": 1081 }, { "epoch": 0.12, "learning_rate": 1.954396277802296e-05, "loss": 0.5015, "step": 1082 }, { "epoch": 0.12, "learning_rate": 1.954285702277879e-05, "loss": 0.4918, "step": 1083 }, { "epoch": 0.12, "learning_rate": 1.954174995995015e-05, "loss": 0.4966, "step": 1084 }, { "epoch": 0.12, "learning_rate": 1.9540641589688735e-05, "loss": 0.4972, "step": 1085 }, { "epoch": 0.12, "learning_rate": 1.953953191214642e-05, "loss": 0.4849, "step": 1086 }, { "epoch": 0.12, "learning_rate": 1.9538420927475247e-05, "loss": 0.5057, "step": 1087 }, { "epoch": 0.12, "learning_rate": 1.953730863582745e-05, "loss": 0.4687, "step": 1088 }, { "epoch": 0.12, "learning_rate": 1.9536195037355438e-05, "loss": 0.4987, "step": 1089 }, { "epoch": 0.12, "learning_rate": 1.9535080132211805e-05, "loss": 0.4879, "step": 1090 }, { "epoch": 0.12, "learning_rate": 1.9533963920549307e-05, "loss": 0.4896, "step": 1091 }, { "epoch": 0.12, "learning_rate": 1.9532846402520898e-05, "loss": 0.4914, "step": 1092 }, { "epoch": 0.12, "learning_rate": 1.95317275782797e-05, "loss": 0.4981, "step": 1093 }, { "epoch": 0.13, "learning_rate": 1.953060744797901e-05, "loss": 0.5114, "step": 1094 }, { "epoch": 0.13, "learning_rate": 1.9529486011772326e-05, "loss": 0.4893, "step": 1095 }, { "epoch": 0.13, "learning_rate": 1.95283632698133e-05, "loss": 0.4894, "step": 1096 }, { "epoch": 0.13, "learning_rate": 1.952723922225577e-05, "loss": 0.4872, "step": 1097 }, { "epoch": 0.13, "learning_rate": 1.952611386925376e-05, "loss": 0.4907, "step": 1098 }, { "epoch": 0.13, "learning_rate": 1.952498721096147e-05, "loss": 0.4816, "step": 1099 }, { "epoch": 0.13, "learning_rate": 1.952385924753328e-05, "loss": 0.4909, "step": 1100 }, { "epoch": 0.13, "learning_rate": 1.9522729979123735e-05, "loss": 0.493, "step": 1101 }, { "epoch": 0.13, "learning_rate": 1.952159940588758e-05, "loss": 0.5024, "step": 1102 }, { "epoch": 0.13, "learning_rate": 1.9520467527979726e-05, "loss": 0.4942, "step": 1103 }, { "epoch": 0.13, "learning_rate": 1.9519334345555264e-05, "loss": 0.484, "step": 1104 }, { "epoch": 0.13, "learning_rate": 1.9518199858769466e-05, "loss": 0.4942, "step": 1105 }, { "epoch": 0.13, "learning_rate": 1.9517064067777786e-05, "loss": 0.469, "step": 1106 }, { "epoch": 0.13, "learning_rate": 1.9515926972735847e-05, "loss": 0.4857, "step": 1107 }, { "epoch": 0.13, "learning_rate": 1.9514788573799457e-05, "loss": 0.4872, "step": 1108 }, { "epoch": 0.13, "learning_rate": 1.9513648871124604e-05, "loss": 0.5115, "step": 1109 }, { "epoch": 0.13, "learning_rate": 1.9512507864867452e-05, "loss": 0.4947, "step": 1110 }, { "epoch": 0.13, "learning_rate": 1.9511365555184345e-05, "loss": 0.4913, "step": 1111 }, { "epoch": 0.13, "learning_rate": 1.9510221942231803e-05, "loss": 0.4762, "step": 1112 }, { "epoch": 0.13, "learning_rate": 1.950907702616653e-05, "loss": 0.4975, "step": 1113 }, { "epoch": 0.13, "learning_rate": 1.9507930807145406e-05, "loss": 0.4734, "step": 1114 }, { "epoch": 0.13, "learning_rate": 1.9506783285325482e-05, "loss": 0.4966, "step": 1115 }, { "epoch": 0.13, "learning_rate": 1.9505634460863997e-05, "loss": 0.4885, "step": 1116 }, { "epoch": 0.13, "learning_rate": 1.950448433391837e-05, "loss": 0.4667, "step": 1117 }, { "epoch": 0.13, "learning_rate": 1.9503332904646188e-05, "loss": 0.5057, "step": 1118 }, { "epoch": 0.13, "learning_rate": 1.9502180173205227e-05, "loss": 0.5029, "step": 1119 }, { "epoch": 0.13, "learning_rate": 1.9501026139753433e-05, "loss": 0.4856, "step": 1120 }, { "epoch": 0.13, "learning_rate": 1.9499870804448936e-05, "loss": 0.4836, "step": 1121 }, { "epoch": 0.13, "learning_rate": 1.9498714167450047e-05, "loss": 0.4915, "step": 1122 }, { "epoch": 0.13, "learning_rate": 1.9497556228915246e-05, "loss": 0.4904, "step": 1123 }, { "epoch": 0.13, "learning_rate": 1.9496396989003195e-05, "loss": 0.4843, "step": 1124 }, { "epoch": 0.13, "learning_rate": 1.9495236447872738e-05, "loss": 0.481, "step": 1125 }, { "epoch": 0.13, "learning_rate": 1.94940746056829e-05, "loss": 0.5034, "step": 1126 }, { "epoch": 0.13, "learning_rate": 1.949291146259287e-05, "loss": 0.4913, "step": 1127 }, { "epoch": 0.13, "learning_rate": 1.949174701876203e-05, "loss": 0.4805, "step": 1128 }, { "epoch": 0.13, "learning_rate": 1.9490581274349934e-05, "loss": 0.4944, "step": 1129 }, { "epoch": 0.13, "learning_rate": 1.9489414229516318e-05, "loss": 0.4868, "step": 1130 }, { "epoch": 0.13, "learning_rate": 1.9488245884421087e-05, "loss": 0.4768, "step": 1131 }, { "epoch": 0.13, "learning_rate": 1.9487076239224337e-05, "loss": 0.4823, "step": 1132 }, { "epoch": 0.13, "learning_rate": 1.948590529408633e-05, "loss": 0.4853, "step": 1133 }, { "epoch": 0.13, "learning_rate": 1.948473304916751e-05, "loss": 0.4846, "step": 1134 }, { "epoch": 0.13, "learning_rate": 1.948355950462851e-05, "loss": 0.5139, "step": 1135 }, { "epoch": 0.13, "learning_rate": 1.9482384660630125e-05, "loss": 0.4903, "step": 1136 }, { "epoch": 0.13, "learning_rate": 1.9481208517333336e-05, "loss": 0.5032, "step": 1137 }, { "epoch": 0.13, "learning_rate": 1.9480031074899303e-05, "loss": 0.4933, "step": 1138 }, { "epoch": 0.13, "learning_rate": 1.9478852333489356e-05, "loss": 0.4865, "step": 1139 }, { "epoch": 0.13, "learning_rate": 1.9477672293265014e-05, "loss": 0.4838, "step": 1140 }, { "epoch": 0.13, "learning_rate": 1.9476490954387968e-05, "loss": 0.4925, "step": 1141 }, { "epoch": 0.13, "learning_rate": 1.947530831702009e-05, "loss": 0.5201, "step": 1142 }, { "epoch": 0.13, "learning_rate": 1.9474124381323424e-05, "loss": 0.4918, "step": 1143 }, { "epoch": 0.13, "learning_rate": 1.9472939147460194e-05, "loss": 0.4993, "step": 1144 }, { "epoch": 0.13, "learning_rate": 1.947175261559281e-05, "loss": 0.4926, "step": 1145 }, { "epoch": 0.13, "learning_rate": 1.9470564785883848e-05, "loss": 0.5156, "step": 1146 }, { "epoch": 0.13, "learning_rate": 1.9469375658496066e-05, "loss": 0.4835, "step": 1147 }, { "epoch": 0.13, "learning_rate": 1.946818523359241e-05, "loss": 0.4778, "step": 1148 }, { "epoch": 0.13, "learning_rate": 1.9466993511335985e-05, "loss": 0.4853, "step": 1149 }, { "epoch": 0.13, "learning_rate": 1.9465800491890087e-05, "loss": 0.4952, "step": 1150 }, { "epoch": 0.13, "learning_rate": 1.946460617541819e-05, "loss": 0.4911, "step": 1151 }, { "epoch": 0.13, "learning_rate": 1.9463410562083937e-05, "loss": 0.4908, "step": 1152 }, { "epoch": 0.13, "learning_rate": 1.946221365205115e-05, "loss": 0.4897, "step": 1153 }, { "epoch": 0.13, "learning_rate": 1.9461015445483843e-05, "loss": 0.4868, "step": 1154 }, { "epoch": 0.13, "learning_rate": 1.9459815942546192e-05, "loss": 0.497, "step": 1155 }, { "epoch": 0.13, "learning_rate": 1.9458615143402554e-05, "loss": 0.4966, "step": 1156 }, { "epoch": 0.13, "learning_rate": 1.9457413048217466e-05, "loss": 0.4687, "step": 1157 }, { "epoch": 0.13, "learning_rate": 1.9456209657155645e-05, "loss": 0.4876, "step": 1158 }, { "epoch": 0.13, "learning_rate": 1.9455004970381978e-05, "loss": 0.5257, "step": 1159 }, { "epoch": 0.13, "learning_rate": 1.9453798988061535e-05, "loss": 0.4873, "step": 1160 }, { "epoch": 0.13, "learning_rate": 1.9452591710359566e-05, "loss": 0.4734, "step": 1161 }, { "epoch": 0.13, "learning_rate": 1.9451383137441492e-05, "loss": 0.485, "step": 1162 }, { "epoch": 0.13, "learning_rate": 1.9450173269472915e-05, "loss": 0.4731, "step": 1163 }, { "epoch": 0.13, "learning_rate": 1.9448962106619614e-05, "loss": 0.4943, "step": 1164 }, { "epoch": 0.13, "learning_rate": 1.944774964904754e-05, "loss": 0.4884, "step": 1165 }, { "epoch": 0.13, "learning_rate": 1.944653589692284e-05, "loss": 0.48, "step": 1166 }, { "epoch": 0.13, "learning_rate": 1.9445320850411816e-05, "loss": 0.5034, "step": 1167 }, { "epoch": 0.13, "learning_rate": 1.9444104509680954e-05, "loss": 0.5059, "step": 1168 }, { "epoch": 0.13, "learning_rate": 1.9442886874896924e-05, "loss": 0.4864, "step": 1169 }, { "epoch": 0.13, "learning_rate": 1.944166794622657e-05, "loss": 0.491, "step": 1170 }, { "epoch": 0.13, "learning_rate": 1.9440447723836914e-05, "loss": 0.4786, "step": 1171 }, { "epoch": 0.13, "learning_rate": 1.9439226207895143e-05, "loss": 0.4786, "step": 1172 }, { "epoch": 0.13, "learning_rate": 1.9438003398568647e-05, "loss": 0.4986, "step": 1173 }, { "epoch": 0.13, "learning_rate": 1.9436779296024967e-05, "loss": 0.4635, "step": 1174 }, { "epoch": 0.13, "learning_rate": 1.9435553900431838e-05, "loss": 0.5228, "step": 1175 }, { "epoch": 0.13, "learning_rate": 1.9434327211957166e-05, "loss": 0.4745, "step": 1176 }, { "epoch": 0.13, "learning_rate": 1.943309923076903e-05, "loss": 0.4875, "step": 1177 }, { "epoch": 0.13, "learning_rate": 1.9431869957035698e-05, "loss": 0.479, "step": 1178 }, { "epoch": 0.13, "learning_rate": 1.9430639390925604e-05, "loss": 0.4843, "step": 1179 }, { "epoch": 0.13, "learning_rate": 1.942940753260736e-05, "loss": 0.4825, "step": 1180 }, { "epoch": 0.13, "learning_rate": 1.9428174382249764e-05, "loss": 0.4885, "step": 1181 }, { "epoch": 0.14, "learning_rate": 1.942693994002178e-05, "loss": 0.4608, "step": 1182 }, { "epoch": 0.14, "learning_rate": 1.9425704206092562e-05, "loss": 0.4976, "step": 1183 }, { "epoch": 0.14, "learning_rate": 1.9424467180631422e-05, "loss": 0.4948, "step": 1184 }, { "epoch": 0.14, "learning_rate": 1.942322886380787e-05, "loss": 0.5119, "step": 1185 }, { "epoch": 0.14, "learning_rate": 1.942198925579158e-05, "loss": 0.4797, "step": 1186 }, { "epoch": 0.14, "learning_rate": 1.9420748356752405e-05, "loss": 0.4915, "step": 1187 }, { "epoch": 0.14, "learning_rate": 1.9419506166860374e-05, "loss": 0.4795, "step": 1188 }, { "epoch": 0.14, "learning_rate": 1.9418262686285697e-05, "loss": 0.4857, "step": 1189 }, { "epoch": 0.14, "learning_rate": 1.9417017915198758e-05, "loss": 0.4809, "step": 1190 }, { "epoch": 0.14, "learning_rate": 1.9415771853770117e-05, "loss": 0.4958, "step": 1191 }, { "epoch": 0.14, "learning_rate": 1.9414524502170514e-05, "loss": 0.49, "step": 1192 }, { "epoch": 0.14, "learning_rate": 1.941327586057087e-05, "loss": 0.5236, "step": 1193 }, { "epoch": 0.14, "learning_rate": 1.9412025929142263e-05, "loss": 0.4767, "step": 1194 }, { "epoch": 0.14, "learning_rate": 1.9410774708055972e-05, "loss": 0.5111, "step": 1195 }, { "epoch": 0.14, "learning_rate": 1.940952219748344e-05, "loss": 0.4883, "step": 1196 }, { "epoch": 0.14, "learning_rate": 1.9408268397596287e-05, "loss": 0.4899, "step": 1197 }, { "epoch": 0.14, "learning_rate": 1.9407013308566315e-05, "loss": 0.4783, "step": 1198 }, { "epoch": 0.14, "learning_rate": 1.9405756930565496e-05, "loss": 0.5071, "step": 1199 }, { "epoch": 0.14, "learning_rate": 1.9404499263765983e-05, "loss": 0.4763, "step": 1200 }, { "epoch": 0.14, "learning_rate": 1.9403240308340105e-05, "loss": 0.4966, "step": 1201 }, { "epoch": 0.14, "learning_rate": 1.940198006446037e-05, "loss": 0.4701, "step": 1202 }, { "epoch": 0.14, "learning_rate": 1.940071853229945e-05, "loss": 0.5047, "step": 1203 }, { "epoch": 0.14, "learning_rate": 1.939945571203021e-05, "loss": 0.4907, "step": 1204 }, { "epoch": 0.14, "learning_rate": 1.9398191603825687e-05, "loss": 0.4777, "step": 1205 }, { "epoch": 0.14, "learning_rate": 1.9396926207859085e-05, "loss": 0.4816, "step": 1206 }, { "epoch": 0.14, "learning_rate": 1.9395659524303795e-05, "loss": 0.492, "step": 1207 }, { "epoch": 0.14, "learning_rate": 1.9394391553333384e-05, "loss": 0.4973, "step": 1208 }, { "epoch": 0.14, "learning_rate": 1.939312229512159e-05, "loss": 0.501, "step": 1209 }, { "epoch": 0.14, "learning_rate": 1.9391851749842326e-05, "loss": 0.4835, "step": 1210 }, { "epoch": 0.14, "learning_rate": 1.939057991766969e-05, "loss": 0.4839, "step": 1211 }, { "epoch": 0.14, "learning_rate": 1.938930679877795e-05, "loss": 0.4796, "step": 1212 }, { "epoch": 0.14, "learning_rate": 1.938803239334155e-05, "loss": 0.4854, "step": 1213 }, { "epoch": 0.14, "learning_rate": 1.9386756701535115e-05, "loss": 0.5023, "step": 1214 }, { "epoch": 0.14, "learning_rate": 1.938547972353344e-05, "loss": 0.476, "step": 1215 }, { "epoch": 0.14, "learning_rate": 1.93842014595115e-05, "loss": 0.4784, "step": 1216 }, { "epoch": 0.14, "learning_rate": 1.9382921909644448e-05, "loss": 0.5077, "step": 1217 }, { "epoch": 0.14, "learning_rate": 1.938164107410761e-05, "loss": 0.5086, "step": 1218 }, { "epoch": 0.14, "learning_rate": 1.938035895307649e-05, "loss": 0.4828, "step": 1219 }, { "epoch": 0.14, "learning_rate": 1.9379075546726764e-05, "loss": 0.4738, "step": 1220 }, { "epoch": 0.14, "learning_rate": 1.9377790855234288e-05, "loss": 0.484, "step": 1221 }, { "epoch": 0.14, "learning_rate": 1.9376504878775098e-05, "loss": 0.4836, "step": 1222 }, { "epoch": 0.14, "learning_rate": 1.9375217617525396e-05, "loss": 0.4859, "step": 1223 }, { "epoch": 0.14, "learning_rate": 1.937392907166157e-05, "loss": 0.4851, "step": 1224 }, { "epoch": 0.14, "learning_rate": 1.9372639241360173e-05, "loss": 0.4709, "step": 1225 }, { "epoch": 0.14, "learning_rate": 1.937134812679795e-05, "loss": 0.5075, "step": 1226 }, { "epoch": 0.14, "learning_rate": 1.9370055728151805e-05, "loss": 0.5, "step": 1227 }, { "epoch": 0.14, "learning_rate": 1.936876204559883e-05, "loss": 0.4768, "step": 1228 }, { "epoch": 0.14, "learning_rate": 1.936746707931628e-05, "loss": 0.5111, "step": 1229 }, { "epoch": 0.14, "learning_rate": 1.9366170829481607e-05, "loss": 0.4642, "step": 1230 }, { "epoch": 0.14, "learning_rate": 1.9364873296272414e-05, "loss": 0.4755, "step": 1231 }, { "epoch": 0.14, "learning_rate": 1.9363574479866504e-05, "loss": 0.4973, "step": 1232 }, { "epoch": 0.14, "learning_rate": 1.936227438044183e-05, "loss": 0.4738, "step": 1233 }, { "epoch": 0.14, "learning_rate": 1.9360972998176547e-05, "loss": 0.4883, "step": 1234 }, { "epoch": 0.14, "learning_rate": 1.9359670333248967e-05, "loss": 0.4855, "step": 1235 }, { "epoch": 0.14, "learning_rate": 1.935836638583759e-05, "loss": 0.503, "step": 1236 }, { "epoch": 0.14, "learning_rate": 1.935706115612108e-05, "loss": 0.4941, "step": 1237 }, { "epoch": 0.14, "learning_rate": 1.935575464427828e-05, "loss": 0.4675, "step": 1238 }, { "epoch": 0.14, "learning_rate": 1.9354446850488216e-05, "loss": 0.468, "step": 1239 }, { "epoch": 0.14, "learning_rate": 1.9353137774930085e-05, "loss": 0.5015, "step": 1240 }, { "epoch": 0.14, "learning_rate": 1.935182741778326e-05, "loss": 0.4915, "step": 1241 }, { "epoch": 0.14, "learning_rate": 1.9350515779227294e-05, "loss": 0.4781, "step": 1242 }, { "epoch": 0.14, "learning_rate": 1.93492028594419e-05, "loss": 0.4798, "step": 1243 }, { "epoch": 0.14, "learning_rate": 1.934788865860698e-05, "loss": 0.4966, "step": 1244 }, { "epoch": 0.14, "learning_rate": 1.9346573176902616e-05, "loss": 0.4916, "step": 1245 }, { "epoch": 0.14, "learning_rate": 1.934525641450905e-05, "loss": 0.4928, "step": 1246 }, { "epoch": 0.14, "learning_rate": 1.9343938371606714e-05, "loss": 0.4975, "step": 1247 }, { "epoch": 0.14, "learning_rate": 1.9342619048376202e-05, "loss": 0.4795, "step": 1248 }, { "epoch": 0.14, "learning_rate": 1.93412984449983e-05, "loss": 0.4847, "step": 1249 }, { "epoch": 0.14, "learning_rate": 1.9339976561653956e-05, "loss": 0.4977, "step": 1250 }, { "epoch": 0.14, "learning_rate": 1.9338653398524295e-05, "loss": 0.4751, "step": 1251 }, { "epoch": 0.14, "learning_rate": 1.933732895579062e-05, "loss": 0.4929, "step": 1252 }, { "epoch": 0.14, "learning_rate": 1.933600323363442e-05, "loss": 0.4971, "step": 1253 }, { "epoch": 0.14, "learning_rate": 1.933467623223733e-05, "loss": 0.4927, "step": 1254 }, { "epoch": 0.14, "learning_rate": 1.9333347951781194e-05, "loss": 0.4969, "step": 1255 }, { "epoch": 0.14, "learning_rate": 1.933201839244801e-05, "loss": 0.4833, "step": 1256 }, { "epoch": 0.14, "learning_rate": 1.9330687554419956e-05, "loss": 0.4656, "step": 1257 }, { "epoch": 0.14, "learning_rate": 1.932935543787939e-05, "loss": 0.496, "step": 1258 }, { "epoch": 0.14, "learning_rate": 1.9328022043008842e-05, "loss": 0.4697, "step": 1259 }, { "epoch": 0.14, "learning_rate": 1.9326687369991012e-05, "loss": 0.4901, "step": 1260 }, { "epoch": 0.14, "learning_rate": 1.9325351419008783e-05, "loss": 0.4935, "step": 1261 }, { "epoch": 0.14, "learning_rate": 1.932401419024521e-05, "loss": 0.5023, "step": 1262 }, { "epoch": 0.14, "learning_rate": 1.9322675683883528e-05, "loss": 0.4864, "step": 1263 }, { "epoch": 0.14, "learning_rate": 1.9321335900107134e-05, "loss": 0.4949, "step": 1264 }, { "epoch": 0.14, "learning_rate": 1.931999483909961e-05, "loss": 0.4694, "step": 1265 }, { "epoch": 0.14, "learning_rate": 1.9318652501044715e-05, "loss": 0.4915, "step": 1266 }, { "epoch": 0.14, "learning_rate": 1.931730888612638e-05, "loss": 0.492, "step": 1267 }, { "epoch": 0.14, "learning_rate": 1.9315963994528707e-05, "loss": 0.4826, "step": 1268 }, { "epoch": 0.15, "learning_rate": 1.931461782643598e-05, "loss": 0.4878, "step": 1269 }, { "epoch": 0.15, "learning_rate": 1.9313270382032644e-05, "loss": 0.5038, "step": 1270 }, { "epoch": 0.15, "learning_rate": 1.9311921661503338e-05, "loss": 0.4938, "step": 1271 }, { "epoch": 0.15, "learning_rate": 1.9310571665032867e-05, "loss": 0.487, "step": 1272 }, { "epoch": 0.15, "learning_rate": 1.9309220392806206e-05, "loss": 0.4885, "step": 1273 }, { "epoch": 0.15, "learning_rate": 1.9307867845008513e-05, "loss": 0.4796, "step": 1274 }, { "epoch": 0.15, "learning_rate": 1.930651402182512e-05, "loss": 0.4803, "step": 1275 }, { "epoch": 0.15, "learning_rate": 1.9305158923441524e-05, "loss": 0.4871, "step": 1276 }, { "epoch": 0.15, "learning_rate": 1.9303802550043404e-05, "loss": 0.4888, "step": 1277 }, { "epoch": 0.15, "learning_rate": 1.930244490181662e-05, "loss": 0.4926, "step": 1278 }, { "epoch": 0.15, "learning_rate": 1.9301085978947195e-05, "loss": 0.4892, "step": 1279 }, { "epoch": 0.15, "learning_rate": 1.9299725781621335e-05, "loss": 0.4975, "step": 1280 }, { "epoch": 0.15, "learning_rate": 1.9298364310025412e-05, "loss": 0.4898, "step": 1281 }, { "epoch": 0.15, "learning_rate": 1.929700156434599e-05, "loss": 0.472, "step": 1282 }, { "epoch": 0.15, "learning_rate": 1.929563754476978e-05, "loss": 0.4749, "step": 1283 }, { "epoch": 0.15, "learning_rate": 1.929427225148369e-05, "loss": 0.4967, "step": 1284 }, { "epoch": 0.15, "learning_rate": 1.92929056846748e-05, "loss": 0.4912, "step": 1285 }, { "epoch": 0.15, "learning_rate": 1.9291537844530352e-05, "loss": 0.4963, "step": 1286 }, { "epoch": 0.15, "learning_rate": 1.9290168731237776e-05, "loss": 0.5038, "step": 1287 }, { "epoch": 0.15, "learning_rate": 1.9288798344984673e-05, "loss": 0.4706, "step": 1288 }, { "epoch": 0.15, "learning_rate": 1.928742668595881e-05, "loss": 0.498, "step": 1289 }, { "epoch": 0.15, "learning_rate": 1.9286053754348142e-05, "loss": 0.488, "step": 1290 }, { "epoch": 0.15, "learning_rate": 1.9284679550340783e-05, "loss": 0.4734, "step": 1291 }, { "epoch": 0.15, "learning_rate": 1.928330407412504e-05, "loss": 0.4883, "step": 1292 }, { "epoch": 0.15, "learning_rate": 1.9281927325889373e-05, "loss": 0.4742, "step": 1293 }, { "epoch": 0.15, "learning_rate": 1.9280549305822435e-05, "loss": 0.499, "step": 1294 }, { "epoch": 0.15, "learning_rate": 1.927917001411304e-05, "loss": 0.4847, "step": 1295 }, { "epoch": 0.15, "learning_rate": 1.9277789450950187e-05, "loss": 0.4661, "step": 1296 }, { "epoch": 0.15, "learning_rate": 1.9276407616523044e-05, "loss": 0.4792, "step": 1297 }, { "epoch": 0.15, "learning_rate": 1.927502451102095e-05, "loss": 0.4986, "step": 1298 }, { "epoch": 0.15, "learning_rate": 1.927364013463342e-05, "loss": 0.4912, "step": 1299 }, { "epoch": 0.15, "learning_rate": 1.9272254487550144e-05, "loss": 0.4729, "step": 1300 }, { "epoch": 0.15, "learning_rate": 1.9270867569960994e-05, "loss": 0.4785, "step": 1301 }, { "epoch": 0.15, "learning_rate": 1.9269479382056008e-05, "loss": 0.5064, "step": 1302 }, { "epoch": 0.15, "learning_rate": 1.926808992402539e-05, "loss": 0.4841, "step": 1303 }, { "epoch": 0.15, "learning_rate": 1.926669919605953e-05, "loss": 0.4717, "step": 1304 }, { "epoch": 0.15, "learning_rate": 1.926530719834899e-05, "loss": 0.4853, "step": 1305 }, { "epoch": 0.15, "learning_rate": 1.9263913931084507e-05, "loss": 0.4704, "step": 1306 }, { "epoch": 0.15, "learning_rate": 1.9262519394456985e-05, "loss": 0.5001, "step": 1307 }, { "epoch": 0.15, "learning_rate": 1.9261123588657514e-05, "loss": 0.4755, "step": 1308 }, { "epoch": 0.15, "learning_rate": 1.925972651387734e-05, "loss": 0.4841, "step": 1309 }, { "epoch": 0.15, "learning_rate": 1.9258328170307905e-05, "loss": 0.5065, "step": 1310 }, { "epoch": 0.15, "learning_rate": 1.9256928558140806e-05, "loss": 0.4867, "step": 1311 }, { "epoch": 0.15, "learning_rate": 1.925552767756782e-05, "loss": 0.4879, "step": 1312 }, { "epoch": 0.15, "learning_rate": 1.9254125528780908e-05, "loss": 0.4927, "step": 1313 }, { "epoch": 0.15, "learning_rate": 1.9252722111972182e-05, "loss": 0.5016, "step": 1314 }, { "epoch": 0.15, "learning_rate": 1.9251317427333953e-05, "loss": 0.5064, "step": 1315 }, { "epoch": 0.15, "learning_rate": 1.924991147505869e-05, "loss": 0.4779, "step": 1316 }, { "epoch": 0.15, "learning_rate": 1.924850425533904e-05, "loss": 0.4678, "step": 1317 }, { "epoch": 0.15, "learning_rate": 1.9247095768367822e-05, "loss": 0.4932, "step": 1318 }, { "epoch": 0.15, "learning_rate": 1.924568601433803e-05, "loss": 0.4863, "step": 1319 }, { "epoch": 0.15, "learning_rate": 1.9244274993442836e-05, "loss": 0.484, "step": 1320 }, { "epoch": 0.15, "learning_rate": 1.924286270587558e-05, "loss": 0.4773, "step": 1321 }, { "epoch": 0.15, "learning_rate": 1.924144915182977e-05, "loss": 0.4771, "step": 1322 }, { "epoch": 0.15, "learning_rate": 1.9240034331499105e-05, "loss": 0.4836, "step": 1323 }, { "epoch": 0.15, "learning_rate": 1.923861824507744e-05, "loss": 0.4933, "step": 1324 }, { "epoch": 0.15, "learning_rate": 1.9237200892758814e-05, "loss": 0.4814, "step": 1325 }, { "epoch": 0.15, "learning_rate": 1.923578227473743e-05, "loss": 0.477, "step": 1326 }, { "epoch": 0.15, "learning_rate": 1.923436239120768e-05, "loss": 0.4851, "step": 1327 }, { "epoch": 0.15, "learning_rate": 1.9232941242364114e-05, "loss": 0.4971, "step": 1328 }, { "epoch": 0.15, "learning_rate": 1.9231518828401458e-05, "loss": 0.488, "step": 1329 }, { "epoch": 0.15, "learning_rate": 1.923009514951462e-05, "loss": 0.4949, "step": 1330 }, { "epoch": 0.15, "learning_rate": 1.9228670205898675e-05, "loss": 0.4887, "step": 1331 }, { "epoch": 0.15, "learning_rate": 1.922724399774887e-05, "loss": 0.4823, "step": 1332 }, { "epoch": 0.15, "learning_rate": 1.9225816525260626e-05, "loss": 0.4923, "step": 1333 }, { "epoch": 0.15, "learning_rate": 1.9224387788629547e-05, "loss": 0.4817, "step": 1334 }, { "epoch": 0.15, "learning_rate": 1.922295778805139e-05, "loss": 0.4834, "step": 1335 }, { "epoch": 0.15, "learning_rate": 1.9221526523722104e-05, "loss": 0.5067, "step": 1336 }, { "epoch": 0.15, "learning_rate": 1.9220093995837805e-05, "loss": 0.4721, "step": 1337 }, { "epoch": 0.15, "learning_rate": 1.9218660204594778e-05, "loss": 0.5119, "step": 1338 }, { "epoch": 0.15, "learning_rate": 1.9217225150189483e-05, "loss": 0.469, "step": 1339 }, { "epoch": 0.15, "learning_rate": 1.921578883281856e-05, "loss": 0.4769, "step": 1340 }, { "epoch": 0.15, "learning_rate": 1.9214351252678815e-05, "loss": 0.4706, "step": 1341 }, { "epoch": 0.15, "learning_rate": 1.9212912409967223e-05, "loss": 0.4812, "step": 1342 }, { "epoch": 0.15, "learning_rate": 1.9211472304880945e-05, "loss": 0.4874, "step": 1343 }, { "epoch": 0.15, "learning_rate": 1.9210030937617303e-05, "loss": 0.5001, "step": 1344 }, { "epoch": 0.15, "learning_rate": 1.9208588308373798e-05, "loss": 0.477, "step": 1345 }, { "epoch": 0.15, "learning_rate": 1.9207144417348103e-05, "loss": 0.5098, "step": 1346 }, { "epoch": 0.15, "learning_rate": 1.9205699264738063e-05, "loss": 0.4901, "step": 1347 }, { "epoch": 0.15, "learning_rate": 1.9204252850741695e-05, "loss": 0.4818, "step": 1348 }, { "epoch": 0.15, "learning_rate": 1.920280517555719e-05, "loss": 0.4806, "step": 1349 }, { "epoch": 0.15, "learning_rate": 1.9201356239382914e-05, "loss": 0.4831, "step": 1350 }, { "epoch": 0.15, "learning_rate": 1.9199906042417403e-05, "loss": 0.4894, "step": 1351 }, { "epoch": 0.15, "learning_rate": 1.919845458485936e-05, "loss": 0.4902, "step": 1352 }, { "epoch": 0.15, "learning_rate": 1.9197001866907676e-05, "loss": 0.4933, "step": 1353 }, { "epoch": 0.15, "learning_rate": 1.9195547888761403e-05, "loss": 0.4747, "step": 1354 }, { "epoch": 0.15, "learning_rate": 1.9194092650619767e-05, "loss": 0.4754, "step": 1355 }, { "epoch": 0.15, "learning_rate": 1.9192636152682173e-05, "loss": 0.5062, "step": 1356 }, { "epoch": 0.16, "learning_rate": 1.9191178395148188e-05, "loss": 0.4714, "step": 1357 }, { "epoch": 0.16, "learning_rate": 1.9189719378217554e-05, "loss": 0.4884, "step": 1358 }, { "epoch": 0.16, "learning_rate": 1.91882591020902e-05, "loss": 0.4867, "step": 1359 }, { "epoch": 0.16, "learning_rate": 1.9186797566966205e-05, "loss": 0.5001, "step": 1360 }, { "epoch": 0.16, "learning_rate": 1.918533477304584e-05, "loss": 0.4858, "step": 1361 }, { "epoch": 0.16, "learning_rate": 1.918387072052954e-05, "loss": 0.4954, "step": 1362 }, { "epoch": 0.16, "learning_rate": 1.918240540961791e-05, "loss": 0.4623, "step": 1363 }, { "epoch": 0.16, "learning_rate": 1.9180938840511727e-05, "loss": 0.5021, "step": 1364 }, { "epoch": 0.16, "learning_rate": 1.917947101341195e-05, "loss": 0.4912, "step": 1365 }, { "epoch": 0.16, "learning_rate": 1.9178001928519703e-05, "loss": 0.4741, "step": 1366 }, { "epoch": 0.16, "learning_rate": 1.9176531586036282e-05, "loss": 0.4754, "step": 1367 }, { "epoch": 0.16, "learning_rate": 1.9175059986163157e-05, "loss": 0.4776, "step": 1368 }, { "epoch": 0.16, "learning_rate": 1.9173587129101967e-05, "loss": 0.4847, "step": 1369 }, { "epoch": 0.16, "learning_rate": 1.917211301505453e-05, "loss": 0.4818, "step": 1370 }, { "epoch": 0.16, "learning_rate": 1.9170637644222835e-05, "loss": 0.465, "step": 1371 }, { "epoch": 0.16, "learning_rate": 1.9169161016809036e-05, "loss": 0.516, "step": 1372 }, { "epoch": 0.16, "learning_rate": 1.9167683133015465e-05, "loss": 0.4855, "step": 1373 }, { "epoch": 0.16, "learning_rate": 1.9166203993044627e-05, "loss": 0.4876, "step": 1374 }, { "epoch": 0.16, "learning_rate": 1.9164723597099192e-05, "loss": 0.4911, "step": 1375 }, { "epoch": 0.16, "learning_rate": 1.9163241945382012e-05, "loss": 0.4916, "step": 1376 }, { "epoch": 0.16, "learning_rate": 1.9161759038096108e-05, "loss": 0.4721, "step": 1377 }, { "epoch": 0.16, "learning_rate": 1.9160274875444668e-05, "loss": 0.4814, "step": 1378 }, { "epoch": 0.16, "learning_rate": 1.9158789457631054e-05, "loss": 0.4883, "step": 1379 }, { "epoch": 0.16, "learning_rate": 1.9157302784858807e-05, "loss": 0.4865, "step": 1380 }, { "epoch": 0.16, "learning_rate": 1.915581485733163e-05, "loss": 0.4839, "step": 1381 }, { "epoch": 0.16, "learning_rate": 1.91543256752534e-05, "loss": 0.4959, "step": 1382 }, { "epoch": 0.16, "learning_rate": 1.915283523882818e-05, "loss": 0.4822, "step": 1383 }, { "epoch": 0.16, "learning_rate": 1.9151343548260176e-05, "loss": 0.4907, "step": 1384 }, { "epoch": 0.16, "learning_rate": 1.9149850603753793e-05, "loss": 0.4936, "step": 1385 }, { "epoch": 0.16, "learning_rate": 1.91483564055136e-05, "loss": 0.4744, "step": 1386 }, { "epoch": 0.16, "learning_rate": 1.9146860953744325e-05, "loss": 0.4955, "step": 1387 }, { "epoch": 0.16, "learning_rate": 1.9145364248650892e-05, "loss": 0.4918, "step": 1388 }, { "epoch": 0.16, "learning_rate": 1.914386629043837e-05, "loss": 0.4582, "step": 1389 }, { "epoch": 0.16, "learning_rate": 1.9142367079312023e-05, "loss": 0.4987, "step": 1390 }, { "epoch": 0.16, "learning_rate": 1.9140866615477272e-05, "loss": 0.4701, "step": 1391 }, { "epoch": 0.16, "learning_rate": 1.913936489913971e-05, "loss": 0.4822, "step": 1392 }, { "epoch": 0.16, "learning_rate": 1.9137861930505112e-05, "loss": 0.4738, "step": 1393 }, { "epoch": 0.16, "learning_rate": 1.9136357709779418e-05, "loss": 0.4974, "step": 1394 }, { "epoch": 0.16, "learning_rate": 1.9134852237168738e-05, "loss": 0.4939, "step": 1395 }, { "epoch": 0.16, "learning_rate": 1.9133345512879353e-05, "loss": 0.4838, "step": 1396 }, { "epoch": 0.16, "learning_rate": 1.9131837537117724e-05, "loss": 0.4822, "step": 1397 }, { "epoch": 0.16, "learning_rate": 1.913032831009047e-05, "loss": 0.5028, "step": 1398 }, { "epoch": 0.16, "learning_rate": 1.9128817832004393e-05, "loss": 0.4745, "step": 1399 }, { "epoch": 0.16, "learning_rate": 1.912730610306646e-05, "loss": 0.4764, "step": 1400 }, { "epoch": 0.16, "learning_rate": 1.9125793123483814e-05, "loss": 0.4963, "step": 1401 }, { "epoch": 0.16, "learning_rate": 1.912427889346377e-05, "loss": 0.4879, "step": 1402 }, { "epoch": 0.16, "learning_rate": 1.91227634132138e-05, "loss": 0.4866, "step": 1403 }, { "epoch": 0.16, "learning_rate": 1.912124668294157e-05, "loss": 0.4828, "step": 1404 }, { "epoch": 0.16, "learning_rate": 1.91197287028549e-05, "loss": 0.5033, "step": 1405 }, { "epoch": 0.16, "learning_rate": 1.9118209473161794e-05, "loss": 0.4922, "step": 1406 }, { "epoch": 0.16, "learning_rate": 1.9116688994070413e-05, "loss": 0.4738, "step": 1407 }, { "epoch": 0.16, "learning_rate": 1.9115167265789096e-05, "loss": 0.4901, "step": 1408 }, { "epoch": 0.16, "learning_rate": 1.911364428852636e-05, "loss": 0.4672, "step": 1409 }, { "epoch": 0.16, "learning_rate": 1.9112120062490883e-05, "loss": 0.4893, "step": 1410 }, { "epoch": 0.16, "learning_rate": 1.911059458789152e-05, "loss": 0.4717, "step": 1411 }, { "epoch": 0.16, "learning_rate": 1.9109067864937292e-05, "loss": 0.4992, "step": 1412 }, { "epoch": 0.16, "learning_rate": 1.9107539893837396e-05, "loss": 0.4814, "step": 1413 }, { "epoch": 0.16, "learning_rate": 1.91060106748012e-05, "loss": 0.4832, "step": 1414 }, { "epoch": 0.16, "learning_rate": 1.9104480208038236e-05, "loss": 0.4766, "step": 1415 }, { "epoch": 0.16, "learning_rate": 1.9102948493758217e-05, "loss": 0.4931, "step": 1416 }, { "epoch": 0.16, "learning_rate": 1.9101415532171018e-05, "loss": 0.4702, "step": 1417 }, { "epoch": 0.16, "learning_rate": 1.90998813234867e-05, "loss": 0.4695, "step": 1418 }, { "epoch": 0.16, "learning_rate": 1.9098345867915467e-05, "loss": 0.5036, "step": 1419 }, { "epoch": 0.16, "learning_rate": 1.909680916566772e-05, "loss": 0.5027, "step": 1420 }, { "epoch": 0.16, "learning_rate": 1.9095271216954022e-05, "loss": 0.4953, "step": 1421 }, { "epoch": 0.16, "learning_rate": 1.9093732021985103e-05, "loss": 0.4851, "step": 1422 }, { "epoch": 0.16, "learning_rate": 1.909219158097187e-05, "loss": 0.4972, "step": 1423 }, { "epoch": 0.16, "learning_rate": 1.9090649894125395e-05, "loss": 0.4746, "step": 1424 }, { "epoch": 0.16, "learning_rate": 1.908910696165693e-05, "loss": 0.4911, "step": 1425 }, { "epoch": 0.16, "learning_rate": 1.908756278377788e-05, "loss": 0.4701, "step": 1426 }, { "epoch": 0.16, "learning_rate": 1.9086017360699843e-05, "loss": 0.4793, "step": 1427 }, { "epoch": 0.16, "learning_rate": 1.9084470692634567e-05, "loss": 0.4962, "step": 1428 }, { "epoch": 0.16, "learning_rate": 1.9082922779793988e-05, "loss": 0.4917, "step": 1429 }, { "epoch": 0.16, "learning_rate": 1.9081373622390204e-05, "loss": 0.5028, "step": 1430 }, { "epoch": 0.16, "learning_rate": 1.9079823220635477e-05, "loss": 0.471, "step": 1431 }, { "epoch": 0.16, "learning_rate": 1.907827157474225e-05, "loss": 0.4818, "step": 1432 }, { "epoch": 0.16, "learning_rate": 1.9076718684923136e-05, "loss": 0.4884, "step": 1433 }, { "epoch": 0.16, "learning_rate": 1.9075164551390918e-05, "loss": 0.4989, "step": 1434 }, { "epoch": 0.16, "learning_rate": 1.9073609174358535e-05, "loss": 0.4663, "step": 1435 }, { "epoch": 0.16, "learning_rate": 1.9072052554039123e-05, "loss": 0.5005, "step": 1436 }, { "epoch": 0.16, "learning_rate": 1.9070494690645966e-05, "loss": 0.4952, "step": 1437 }, { "epoch": 0.16, "learning_rate": 1.9068935584392522e-05, "loss": 0.4959, "step": 1438 }, { "epoch": 0.16, "learning_rate": 1.906737523549243e-05, "loss": 0.4891, "step": 1439 }, { "epoch": 0.16, "learning_rate": 1.9065813644159495e-05, "loss": 0.4844, "step": 1440 }, { "epoch": 0.16, "learning_rate": 1.906425081060768e-05, "loss": 0.4942, "step": 1441 }, { "epoch": 0.16, "learning_rate": 1.906268673505114e-05, "loss": 0.4822, "step": 1442 }, { "epoch": 0.16, "learning_rate": 1.906112141770418e-05, "loss": 0.4636, "step": 1443 }, { "epoch": 0.17, "learning_rate": 1.9059554858781285e-05, "loss": 0.488, "step": 1444 }, { "epoch": 0.17, "learning_rate": 1.9057987058497106e-05, "loss": 0.5003, "step": 1445 }, { "epoch": 0.17, "learning_rate": 1.9056418017066476e-05, "loss": 0.503, "step": 1446 }, { "epoch": 0.17, "learning_rate": 1.905484773470438e-05, "loss": 0.4837, "step": 1447 }, { "epoch": 0.17, "learning_rate": 1.905327621162598e-05, "loss": 0.4655, "step": 1448 }, { "epoch": 0.17, "learning_rate": 1.905170344804662e-05, "loss": 0.4768, "step": 1449 }, { "epoch": 0.17, "learning_rate": 1.90501294441818e-05, "loss": 0.4872, "step": 1450 }, { "epoch": 0.17, "learning_rate": 1.9048554200247184e-05, "loss": 0.4736, "step": 1451 }, { "epoch": 0.17, "learning_rate": 1.9046977716458627e-05, "loss": 0.4808, "step": 1452 }, { "epoch": 0.17, "learning_rate": 1.904539999303214e-05, "loss": 0.4925, "step": 1453 }, { "epoch": 0.17, "learning_rate": 1.90438210301839e-05, "loss": 0.4836, "step": 1454 }, { "epoch": 0.17, "learning_rate": 1.9042240828130267e-05, "loss": 0.4678, "step": 1455 }, { "epoch": 0.17, "learning_rate": 1.9040659387087762e-05, "loss": 0.4835, "step": 1456 }, { "epoch": 0.17, "learning_rate": 1.903907670727308e-05, "loss": 0.4949, "step": 1457 }, { "epoch": 0.17, "learning_rate": 1.903749278890308e-05, "loss": 0.4879, "step": 1458 }, { "epoch": 0.17, "learning_rate": 1.903590763219479e-05, "loss": 0.5004, "step": 1459 }, { "epoch": 0.17, "learning_rate": 1.9034321237365424e-05, "loss": 0.4882, "step": 1460 }, { "epoch": 0.17, "learning_rate": 1.9032733604632347e-05, "loss": 0.4818, "step": 1461 }, { "epoch": 0.17, "learning_rate": 1.9031144734213097e-05, "loss": 0.5016, "step": 1462 }, { "epoch": 0.17, "learning_rate": 1.9029554626325386e-05, "loss": 0.5071, "step": 1463 }, { "epoch": 0.17, "learning_rate": 1.90279632811871e-05, "loss": 0.4721, "step": 1464 }, { "epoch": 0.17, "learning_rate": 1.902637069901628e-05, "loss": 0.4908, "step": 1465 }, { "epoch": 0.17, "learning_rate": 1.9024776880031154e-05, "loss": 0.4762, "step": 1466 }, { "epoch": 0.17, "learning_rate": 1.9023181824450106e-05, "loss": 0.4817, "step": 1467 }, { "epoch": 0.17, "learning_rate": 1.9021585532491694e-05, "loss": 0.4806, "step": 1468 }, { "epoch": 0.17, "learning_rate": 1.9019988004374645e-05, "loss": 0.4877, "step": 1469 }, { "epoch": 0.17, "learning_rate": 1.901838924031786e-05, "loss": 0.4813, "step": 1470 }, { "epoch": 0.17, "learning_rate": 1.90167892405404e-05, "loss": 0.4945, "step": 1471 }, { "epoch": 0.17, "learning_rate": 1.9015188005261505e-05, "loss": 0.4863, "step": 1472 }, { "epoch": 0.17, "learning_rate": 1.9013585534700582e-05, "loss": 0.4841, "step": 1473 }, { "epoch": 0.17, "learning_rate": 1.90119818290772e-05, "loss": 0.4733, "step": 1474 }, { "epoch": 0.17, "learning_rate": 1.9010376888611106e-05, "loss": 0.4872, "step": 1475 }, { "epoch": 0.17, "learning_rate": 1.9008770713522206e-05, "loss": 0.4819, "step": 1476 }, { "epoch": 0.17, "learning_rate": 1.9007163304030593e-05, "loss": 0.4832, "step": 1477 }, { "epoch": 0.17, "learning_rate": 1.9005554660356505e-05, "loss": 0.478, "step": 1478 }, { "epoch": 0.17, "learning_rate": 1.9003944782720375e-05, "loss": 0.4873, "step": 1479 }, { "epoch": 0.17, "learning_rate": 1.9002333671342782e-05, "loss": 0.4852, "step": 1480 }, { "epoch": 0.17, "learning_rate": 1.9000721326444492e-05, "loss": 0.4965, "step": 1481 }, { "epoch": 0.17, "learning_rate": 1.8999107748246427e-05, "loss": 0.4757, "step": 1482 }, { "epoch": 0.17, "learning_rate": 1.8997492936969686e-05, "loss": 0.4775, "step": 1483 }, { "epoch": 0.17, "learning_rate": 1.899587689283553e-05, "loss": 0.4777, "step": 1484 }, { "epoch": 0.17, "learning_rate": 1.89942596160654e-05, "loss": 0.4887, "step": 1485 }, { "epoch": 0.17, "learning_rate": 1.899264110688089e-05, "loss": 0.4752, "step": 1486 }, { "epoch": 0.17, "learning_rate": 1.8991021365503782e-05, "loss": 0.4975, "step": 1487 }, { "epoch": 0.17, "learning_rate": 1.8989400392156012e-05, "loss": 0.4667, "step": 1488 }, { "epoch": 0.17, "learning_rate": 1.898777818705969e-05, "loss": 0.5035, "step": 1489 }, { "epoch": 0.17, "learning_rate": 1.898615475043709e-05, "loss": 0.4994, "step": 1490 }, { "epoch": 0.17, "learning_rate": 1.8984530082510665e-05, "loss": 0.4835, "step": 1491 }, { "epoch": 0.17, "learning_rate": 1.898290418350303e-05, "loss": 0.4679, "step": 1492 }, { "epoch": 0.17, "learning_rate": 1.8981277053636963e-05, "loss": 0.4847, "step": 1493 }, { "epoch": 0.17, "learning_rate": 1.8979648693135428e-05, "loss": 0.4753, "step": 1494 }, { "epoch": 0.17, "learning_rate": 1.8978019102221538e-05, "loss": 0.5043, "step": 1495 }, { "epoch": 0.17, "learning_rate": 1.8976388281118584e-05, "loss": 0.4708, "step": 1496 }, { "epoch": 0.17, "learning_rate": 1.8974756230050028e-05, "loss": 0.4852, "step": 1497 }, { "epoch": 0.17, "learning_rate": 1.8973122949239497e-05, "loss": 0.4888, "step": 1498 }, { "epoch": 0.17, "learning_rate": 1.897148843891079e-05, "loss": 0.4918, "step": 1499 }, { "epoch": 0.17, "learning_rate": 1.8969852699287865e-05, "loss": 0.4865, "step": 1500 }, { "epoch": 0.17, "learning_rate": 1.896821573059486e-05, "loss": 0.4742, "step": 1501 }, { "epoch": 0.17, "learning_rate": 1.896657753305607e-05, "loss": 0.4891, "step": 1502 }, { "epoch": 0.17, "learning_rate": 1.896493810689597e-05, "loss": 0.5085, "step": 1503 }, { "epoch": 0.17, "learning_rate": 1.89632974523392e-05, "loss": 0.5098, "step": 1504 }, { "epoch": 0.17, "learning_rate": 1.8961655569610557e-05, "loss": 0.4616, "step": 1505 }, { "epoch": 0.17, "learning_rate": 1.8960012458935025e-05, "loss": 0.4735, "step": 1506 }, { "epoch": 0.17, "learning_rate": 1.8958368120537746e-05, "loss": 0.5024, "step": 1507 }, { "epoch": 0.17, "learning_rate": 1.8956722554644026e-05, "loss": 0.4795, "step": 1508 }, { "epoch": 0.17, "learning_rate": 1.8955075761479342e-05, "loss": 0.4802, "step": 1509 }, { "epoch": 0.17, "learning_rate": 1.895342774126935e-05, "loss": 0.4744, "step": 1510 }, { "epoch": 0.17, "learning_rate": 1.8951778494239862e-05, "loss": 0.4734, "step": 1511 }, { "epoch": 0.17, "learning_rate": 1.8950128020616863e-05, "loss": 0.4954, "step": 1512 }, { "epoch": 0.17, "learning_rate": 1.89484763206265e-05, "loss": 0.4863, "step": 1513 }, { "epoch": 0.17, "learning_rate": 1.89468233944951e-05, "loss": 0.4804, "step": 1514 }, { "epoch": 0.17, "learning_rate": 1.8945169242449145e-05, "loss": 0.5027, "step": 1515 }, { "epoch": 0.17, "learning_rate": 1.894351386471529e-05, "loss": 0.4762, "step": 1516 }, { "epoch": 0.17, "learning_rate": 1.8941857261520363e-05, "loss": 0.4789, "step": 1517 }, { "epoch": 0.17, "learning_rate": 1.8940199433091354e-05, "loss": 0.4867, "step": 1518 }, { "epoch": 0.17, "learning_rate": 1.893854037965542e-05, "loss": 0.4938, "step": 1519 }, { "epoch": 0.17, "learning_rate": 1.8936880101439893e-05, "loss": 0.4817, "step": 1520 }, { "epoch": 0.17, "learning_rate": 1.8935218598672266e-05, "loss": 0.5014, "step": 1521 }, { "epoch": 0.17, "learning_rate": 1.8933555871580204e-05, "loss": 0.4909, "step": 1522 }, { "epoch": 0.17, "learning_rate": 1.8931891920391533e-05, "loss": 0.5019, "step": 1523 }, { "epoch": 0.17, "learning_rate": 1.893022674533425e-05, "loss": 0.482, "step": 1524 }, { "epoch": 0.17, "learning_rate": 1.8928560346636532e-05, "loss": 0.507, "step": 1525 }, { "epoch": 0.17, "learning_rate": 1.89268927245267e-05, "loss": 0.4968, "step": 1526 }, { "epoch": 0.17, "learning_rate": 1.8925223879233267e-05, "loss": 0.4785, "step": 1527 }, { "epoch": 0.17, "learning_rate": 1.8923553810984893e-05, "loss": 0.4749, "step": 1528 }, { "epoch": 0.17, "learning_rate": 1.8921882520010416e-05, "loss": 0.4744, "step": 1529 }, { "epoch": 0.17, "learning_rate": 1.8920210006538843e-05, "loss": 0.5001, "step": 1530 }, { "epoch": 0.17, "learning_rate": 1.891853627079935e-05, "loss": 0.4816, "step": 1531 }, { "epoch": 0.18, "learning_rate": 1.8916861313021268e-05, "loss": 0.4662, "step": 1532 }, { "epoch": 0.18, "learning_rate": 1.8915185133434107e-05, "loss": 0.4976, "step": 1533 }, { "epoch": 0.18, "learning_rate": 1.891350773226754e-05, "loss": 0.48, "step": 1534 }, { "epoch": 0.18, "learning_rate": 1.891182910975141e-05, "loss": 0.4784, "step": 1535 }, { "epoch": 0.18, "learning_rate": 1.8910149266115724e-05, "loss": 0.4776, "step": 1536 }, { "epoch": 0.18, "learning_rate": 1.890846820159066e-05, "loss": 0.4834, "step": 1537 }, { "epoch": 0.18, "learning_rate": 1.890678591640656e-05, "loss": 0.4873, "step": 1538 }, { "epoch": 0.18, "learning_rate": 1.8905102410793936e-05, "loss": 0.5074, "step": 1539 }, { "epoch": 0.18, "learning_rate": 1.8903417684983465e-05, "loss": 0.478, "step": 1540 }, { "epoch": 0.18, "learning_rate": 1.8901731739205992e-05, "loss": 0.483, "step": 1541 }, { "epoch": 0.18, "learning_rate": 1.8900044573692527e-05, "loss": 0.4688, "step": 1542 }, { "epoch": 0.18, "learning_rate": 1.8898356188674253e-05, "loss": 0.487, "step": 1543 }, { "epoch": 0.18, "learning_rate": 1.8896666584382516e-05, "loss": 0.489, "step": 1544 }, { "epoch": 0.18, "learning_rate": 1.8894975761048826e-05, "loss": 0.4841, "step": 1545 }, { "epoch": 0.18, "learning_rate": 1.8893283718904866e-05, "loss": 0.4876, "step": 1546 }, { "epoch": 0.18, "learning_rate": 1.8891590458182486e-05, "loss": 0.4965, "step": 1547 }, { "epoch": 0.18, "learning_rate": 1.8889895979113698e-05, "loss": 0.4915, "step": 1548 }, { "epoch": 0.18, "learning_rate": 1.888820028193068e-05, "loss": 0.4695, "step": 1549 }, { "epoch": 0.18, "learning_rate": 1.8886503366865786e-05, "loss": 0.4902, "step": 1550 }, { "epoch": 0.18, "learning_rate": 1.888480523415153e-05, "loss": 0.4967, "step": 1551 }, { "epoch": 0.18, "learning_rate": 1.8883105884020595e-05, "loss": 0.4639, "step": 1552 }, { "epoch": 0.18, "learning_rate": 1.8881405316705824e-05, "loss": 0.4954, "step": 1553 }, { "epoch": 0.18, "learning_rate": 1.887970353244024e-05, "loss": 0.4777, "step": 1554 }, { "epoch": 0.18, "learning_rate": 1.887800053145702e-05, "loss": 0.4929, "step": 1555 }, { "epoch": 0.18, "learning_rate": 1.8876296313989516e-05, "loss": 0.5071, "step": 1556 }, { "epoch": 0.18, "learning_rate": 1.8874590880271245e-05, "loss": 0.4704, "step": 1557 }, { "epoch": 0.18, "learning_rate": 1.8872884230535886e-05, "loss": 0.468, "step": 1558 }, { "epoch": 0.18, "learning_rate": 1.8871176365017293e-05, "loss": 0.4986, "step": 1559 }, { "epoch": 0.18, "learning_rate": 1.8869467283949475e-05, "loss": 0.4718, "step": 1560 }, { "epoch": 0.18, "learning_rate": 1.8867756987566615e-05, "loss": 0.4777, "step": 1561 }, { "epoch": 0.18, "learning_rate": 1.8866045476103073e-05, "loss": 0.492, "step": 1562 }, { "epoch": 0.18, "learning_rate": 1.886433274979335e-05, "loss": 0.5308, "step": 1563 }, { "epoch": 0.18, "learning_rate": 1.8862618808872138e-05, "loss": 0.4872, "step": 1564 }, { "epoch": 0.18, "learning_rate": 1.8860903653574277e-05, "loss": 0.4714, "step": 1565 }, { "epoch": 0.18, "learning_rate": 1.8859187284134785e-05, "loss": 0.4829, "step": 1566 }, { "epoch": 0.18, "learning_rate": 1.8857469700788845e-05, "loss": 0.4899, "step": 1567 }, { "epoch": 0.18, "learning_rate": 1.8855750903771805e-05, "loss": 0.4854, "step": 1568 }, { "epoch": 0.18, "learning_rate": 1.8854030893319173e-05, "loss": 0.4738, "step": 1569 }, { "epoch": 0.18, "learning_rate": 1.8852309669666634e-05, "loss": 0.4797, "step": 1570 }, { "epoch": 0.18, "learning_rate": 1.885058723305003e-05, "loss": 0.4985, "step": 1571 }, { "epoch": 0.18, "learning_rate": 1.8848863583705373e-05, "loss": 0.4893, "step": 1572 }, { "epoch": 0.18, "learning_rate": 1.884713872186885e-05, "loss": 0.5035, "step": 1573 }, { "epoch": 0.18, "learning_rate": 1.8845412647776795e-05, "loss": 0.4932, "step": 1574 }, { "epoch": 0.18, "learning_rate": 1.8843685361665724e-05, "loss": 0.4753, "step": 1575 }, { "epoch": 0.18, "learning_rate": 1.8841956863772314e-05, "loss": 0.4796, "step": 1576 }, { "epoch": 0.18, "learning_rate": 1.8840227154333405e-05, "loss": 0.4888, "step": 1577 }, { "epoch": 0.18, "learning_rate": 1.883849623358601e-05, "loss": 0.4732, "step": 1578 }, { "epoch": 0.18, "learning_rate": 1.88367641017673e-05, "loss": 0.4919, "step": 1579 }, { "epoch": 0.18, "learning_rate": 1.8835030759114617e-05, "loss": 0.4883, "step": 1580 }, { "epoch": 0.18, "learning_rate": 1.8833296205865466e-05, "loss": 0.4923, "step": 1581 }, { "epoch": 0.18, "learning_rate": 1.8831560442257523e-05, "loss": 0.477, "step": 1582 }, { "epoch": 0.18, "learning_rate": 1.8829823468528624e-05, "loss": 0.4749, "step": 1583 }, { "epoch": 0.18, "learning_rate": 1.8828085284916777e-05, "loss": 0.4813, "step": 1584 }, { "epoch": 0.18, "learning_rate": 1.882634589166014e-05, "loss": 0.5162, "step": 1585 }, { "epoch": 0.18, "learning_rate": 1.8824605288997064e-05, "loss": 0.4578, "step": 1586 }, { "epoch": 0.18, "learning_rate": 1.882286347716604e-05, "loss": 0.5004, "step": 1587 }, { "epoch": 0.18, "learning_rate": 1.8821120456405743e-05, "loss": 0.4933, "step": 1588 }, { "epoch": 0.18, "learning_rate": 1.8819376226955e-05, "loss": 0.5036, "step": 1589 }, { "epoch": 0.18, "learning_rate": 1.8817630789052813e-05, "loss": 0.4774, "step": 1590 }, { "epoch": 0.18, "learning_rate": 1.881588414293834e-05, "loss": 0.4817, "step": 1591 }, { "epoch": 0.18, "learning_rate": 1.881413628885092e-05, "loss": 0.4606, "step": 1592 }, { "epoch": 0.18, "learning_rate": 1.8812387227030035e-05, "loss": 0.4866, "step": 1593 }, { "epoch": 0.18, "learning_rate": 1.8810636957715357e-05, "loss": 0.4622, "step": 1594 }, { "epoch": 0.18, "learning_rate": 1.880888548114671e-05, "loss": 0.4884, "step": 1595 }, { "epoch": 0.18, "learning_rate": 1.880713279756408e-05, "loss": 0.479, "step": 1596 }, { "epoch": 0.18, "learning_rate": 1.880537890720763e-05, "loss": 0.4996, "step": 1597 }, { "epoch": 0.18, "learning_rate": 1.8803623810317678e-05, "loss": 0.4693, "step": 1598 }, { "epoch": 0.18, "learning_rate": 1.8801867507134712e-05, "loss": 0.4771, "step": 1599 }, { "epoch": 0.18, "learning_rate": 1.8800109997899386e-05, "loss": 0.4914, "step": 1600 }, { "epoch": 0.18, "learning_rate": 1.879835128285252e-05, "loss": 0.4782, "step": 1601 }, { "epoch": 0.18, "learning_rate": 1.879659136223509e-05, "loss": 0.4953, "step": 1602 }, { "epoch": 0.18, "learning_rate": 1.8794830236288254e-05, "loss": 0.4904, "step": 1603 }, { "epoch": 0.18, "learning_rate": 1.8793067905253318e-05, "loss": 0.4721, "step": 1604 }, { "epoch": 0.18, "learning_rate": 1.8791304369371765e-05, "loss": 0.5035, "step": 1605 }, { "epoch": 0.18, "learning_rate": 1.8789539628885233e-05, "loss": 0.4752, "step": 1606 }, { "epoch": 0.18, "learning_rate": 1.878777368403554e-05, "loss": 0.4852, "step": 1607 }, { "epoch": 0.18, "learning_rate": 1.8786006535064654e-05, "loss": 0.496, "step": 1608 }, { "epoch": 0.18, "learning_rate": 1.8784238182214713e-05, "loss": 0.4785, "step": 1609 }, { "epoch": 0.18, "learning_rate": 1.8782468625728027e-05, "loss": 0.4813, "step": 1610 }, { "epoch": 0.18, "learning_rate": 1.8780697865847056e-05, "loss": 0.5088, "step": 1611 }, { "epoch": 0.18, "learning_rate": 1.877892590281444e-05, "loss": 0.4805, "step": 1612 }, { "epoch": 0.18, "learning_rate": 1.877715273687297e-05, "loss": 0.5001, "step": 1613 }, { "epoch": 0.18, "learning_rate": 1.8775378368265622e-05, "loss": 0.4999, "step": 1614 }, { "epoch": 0.18, "learning_rate": 1.8773602797235516e-05, "loss": 0.4834, "step": 1615 }, { "epoch": 0.18, "learning_rate": 1.8771826024025944e-05, "loss": 0.4797, "step": 1616 }, { "epoch": 0.18, "learning_rate": 1.8770048048880367e-05, "loss": 0.488, "step": 1617 }, { "epoch": 0.18, "learning_rate": 1.8768268872042402e-05, "loss": 0.4786, "step": 1618 }, { "epoch": 0.19, "learning_rate": 1.8766488493755845e-05, "loss": 0.4776, "step": 1619 }, { "epoch": 0.19, "learning_rate": 1.8764706914264636e-05, "loss": 0.4899, "step": 1620 }, { "epoch": 0.19, "learning_rate": 1.8762924133812905e-05, "loss": 0.4933, "step": 1621 }, { "epoch": 0.19, "learning_rate": 1.876114015264492e-05, "loss": 0.4851, "step": 1622 }, { "epoch": 0.19, "learning_rate": 1.8759354971005133e-05, "loss": 0.4766, "step": 1623 }, { "epoch": 0.19, "learning_rate": 1.875756858913815e-05, "loss": 0.5006, "step": 1624 }, { "epoch": 0.19, "learning_rate": 1.875578100728875e-05, "loss": 0.4958, "step": 1625 }, { "epoch": 0.19, "learning_rate": 1.8753992225701868e-05, "loss": 0.482, "step": 1626 }, { "epoch": 0.19, "learning_rate": 1.875220224462261e-05, "loss": 0.4894, "step": 1627 }, { "epoch": 0.19, "learning_rate": 1.8750411064296237e-05, "loss": 0.474, "step": 1628 }, { "epoch": 0.19, "learning_rate": 1.8748618684968187e-05, "loss": 0.507, "step": 1629 }, { "epoch": 0.19, "learning_rate": 1.8746825106884055e-05, "loss": 0.4657, "step": 1630 }, { "epoch": 0.19, "learning_rate": 1.87450303302896e-05, "loss": 0.484, "step": 1631 }, { "epoch": 0.19, "learning_rate": 1.8743234355430746e-05, "loss": 0.479, "step": 1632 }, { "epoch": 0.19, "learning_rate": 1.8741437182553582e-05, "loss": 0.4876, "step": 1633 }, { "epoch": 0.19, "learning_rate": 1.8739638811904363e-05, "loss": 0.5082, "step": 1634 }, { "epoch": 0.19, "learning_rate": 1.8737839243729504e-05, "loss": 0.4617, "step": 1635 }, { "epoch": 0.19, "learning_rate": 1.8736038478275584e-05, "loss": 0.4841, "step": 1636 }, { "epoch": 0.19, "learning_rate": 1.873423651578935e-05, "loss": 0.4825, "step": 1637 }, { "epoch": 0.19, "learning_rate": 1.8732433356517713e-05, "loss": 0.4856, "step": 1638 }, { "epoch": 0.19, "learning_rate": 1.8730629000707746e-05, "loss": 0.4894, "step": 1639 }, { "epoch": 0.19, "learning_rate": 1.872882344860668e-05, "loss": 0.4878, "step": 1640 }, { "epoch": 0.19, "learning_rate": 1.872701670046192e-05, "loss": 0.5066, "step": 1641 }, { "epoch": 0.19, "learning_rate": 1.8725208756521036e-05, "loss": 0.4937, "step": 1642 }, { "epoch": 0.19, "learning_rate": 1.8723399617031754e-05, "loss": 0.4747, "step": 1643 }, { "epoch": 0.19, "learning_rate": 1.8721589282241956e-05, "loss": 0.4769, "step": 1644 }, { "epoch": 0.19, "learning_rate": 1.8719777752399713e-05, "loss": 0.4826, "step": 1645 }, { "epoch": 0.19, "learning_rate": 1.8717965027753235e-05, "loss": 0.4781, "step": 1646 }, { "epoch": 0.19, "learning_rate": 1.8716151108550912e-05, "loss": 0.4992, "step": 1647 }, { "epoch": 0.19, "learning_rate": 1.871433599504129e-05, "loss": 0.4906, "step": 1648 }, { "epoch": 0.19, "learning_rate": 1.8712519687473075e-05, "loss": 0.4832, "step": 1649 }, { "epoch": 0.19, "learning_rate": 1.8710702186095147e-05, "loss": 0.4871, "step": 1650 }, { "epoch": 0.19, "learning_rate": 1.8708883491156544e-05, "loss": 0.4787, "step": 1651 }, { "epoch": 0.19, "learning_rate": 1.8707063602906466e-05, "loss": 0.4772, "step": 1652 }, { "epoch": 0.19, "learning_rate": 1.8705242521594276e-05, "loss": 0.4791, "step": 1653 }, { "epoch": 0.19, "learning_rate": 1.870342024746951e-05, "loss": 0.4847, "step": 1654 }, { "epoch": 0.19, "learning_rate": 1.8701596780781855e-05, "loss": 0.4919, "step": 1655 }, { "epoch": 0.19, "learning_rate": 1.869977212178117e-05, "loss": 0.4897, "step": 1656 }, { "epoch": 0.19, "learning_rate": 1.8697946270717468e-05, "loss": 0.4652, "step": 1657 }, { "epoch": 0.19, "learning_rate": 1.8696119227840937e-05, "loss": 0.493, "step": 1658 }, { "epoch": 0.19, "learning_rate": 1.869429099340192e-05, "loss": 0.46, "step": 1659 }, { "epoch": 0.19, "learning_rate": 1.8692461567650925e-05, "loss": 0.5069, "step": 1660 }, { "epoch": 0.19, "learning_rate": 1.869063095083863e-05, "loss": 0.4855, "step": 1661 }, { "epoch": 0.19, "learning_rate": 1.8688799143215863e-05, "loss": 0.4678, "step": 1662 }, { "epoch": 0.19, "learning_rate": 1.8686966145033626e-05, "loss": 0.4733, "step": 1663 }, { "epoch": 0.19, "learning_rate": 1.8685131956543082e-05, "loss": 0.4652, "step": 1664 }, { "epoch": 0.19, "learning_rate": 1.8683296577995554e-05, "loss": 0.4923, "step": 1665 }, { "epoch": 0.19, "learning_rate": 1.8681460009642533e-05, "loss": 0.4963, "step": 1666 }, { "epoch": 0.19, "learning_rate": 1.867962225173566e-05, "loss": 0.4617, "step": 1667 }, { "epoch": 0.19, "learning_rate": 1.867778330452676e-05, "loss": 0.4967, "step": 1668 }, { "epoch": 0.19, "learning_rate": 1.8675943168267804e-05, "loss": 0.4924, "step": 1669 }, { "epoch": 0.19, "learning_rate": 1.8674101843210935e-05, "loss": 0.4953, "step": 1670 }, { "epoch": 0.19, "learning_rate": 1.8672259329608457e-05, "loss": 0.4848, "step": 1671 }, { "epoch": 0.19, "learning_rate": 1.8670415627712825e-05, "loss": 0.4905, "step": 1672 }, { "epoch": 0.19, "learning_rate": 1.866857073777668e-05, "loss": 0.4961, "step": 1673 }, { "epoch": 0.19, "learning_rate": 1.8666724660052807e-05, "loss": 0.4816, "step": 1674 }, { "epoch": 0.19, "learning_rate": 1.8664877394794158e-05, "loss": 0.4707, "step": 1675 }, { "epoch": 0.19, "learning_rate": 1.8663028942253854e-05, "loss": 0.4883, "step": 1676 }, { "epoch": 0.19, "learning_rate": 1.8661179302685177e-05, "loss": 0.4905, "step": 1677 }, { "epoch": 0.19, "learning_rate": 1.8659328476341557e-05, "loss": 0.4828, "step": 1678 }, { "epoch": 0.19, "learning_rate": 1.865747646347661e-05, "loss": 0.4787, "step": 1679 }, { "epoch": 0.19, "learning_rate": 1.8655623264344103e-05, "loss": 0.478, "step": 1680 }, { "epoch": 0.19, "learning_rate": 1.8653768879197956e-05, "loss": 0.5098, "step": 1681 }, { "epoch": 0.19, "learning_rate": 1.865191330829227e-05, "loss": 0.4905, "step": 1682 }, { "epoch": 0.19, "learning_rate": 1.8650056551881297e-05, "loss": 0.4881, "step": 1683 }, { "epoch": 0.19, "learning_rate": 1.8648198610219452e-05, "loss": 0.4741, "step": 1684 }, { "epoch": 0.19, "learning_rate": 1.864633948356132e-05, "loss": 0.4758, "step": 1685 }, { "epoch": 0.19, "learning_rate": 1.8644479172161635e-05, "loss": 0.4836, "step": 1686 }, { "epoch": 0.19, "learning_rate": 1.8642617676275306e-05, "loss": 0.4902, "step": 1687 }, { "epoch": 0.19, "learning_rate": 1.8640754996157397e-05, "loss": 0.4673, "step": 1688 }, { "epoch": 0.19, "learning_rate": 1.863889113206314e-05, "loss": 0.5032, "step": 1689 }, { "epoch": 0.19, "learning_rate": 1.863702608424793e-05, "loss": 0.4906, "step": 1690 }, { "epoch": 0.19, "learning_rate": 1.863515985296731e-05, "loss": 0.4808, "step": 1691 }, { "epoch": 0.19, "learning_rate": 1.8633292438476998e-05, "loss": 0.4903, "step": 1692 }, { "epoch": 0.19, "learning_rate": 1.8631423841032876e-05, "loss": 0.4751, "step": 1693 }, { "epoch": 0.19, "learning_rate": 1.8629554060890982e-05, "loss": 0.4874, "step": 1694 }, { "epoch": 0.19, "learning_rate": 1.8627683098307516e-05, "loss": 0.4805, "step": 1695 }, { "epoch": 0.19, "learning_rate": 1.862581095353884e-05, "loss": 0.4862, "step": 1696 }, { "epoch": 0.19, "learning_rate": 1.8623937626841485e-05, "loss": 0.4728, "step": 1697 }, { "epoch": 0.19, "learning_rate": 1.8622063118472135e-05, "loss": 0.4992, "step": 1698 }, { "epoch": 0.19, "learning_rate": 1.8620187428687643e-05, "loss": 0.4798, "step": 1699 }, { "epoch": 0.19, "learning_rate": 1.861831055774501e-05, "loss": 0.4886, "step": 1700 }, { "epoch": 0.19, "learning_rate": 1.8616432505901427e-05, "loss": 0.4727, "step": 1701 }, { "epoch": 0.19, "learning_rate": 1.861455327341421e-05, "loss": 0.4862, "step": 1702 }, { "epoch": 0.19, "learning_rate": 1.8612672860540865e-05, "loss": 0.4721, "step": 1703 }, { "epoch": 0.19, "learning_rate": 1.8610791267539053e-05, "loss": 0.4631, "step": 1704 }, { "epoch": 0.19, "learning_rate": 1.8608908494666593e-05, "loss": 0.4935, "step": 1705 }, { "epoch": 0.19, "learning_rate": 1.8607024542181465e-05, "loss": 0.4937, "step": 1706 }, { "epoch": 0.2, "learning_rate": 1.860513941034181e-05, "loss": 0.474, "step": 1707 }, { "epoch": 0.2, "learning_rate": 1.8603253099405937e-05, "loss": 0.4716, "step": 1708 }, { "epoch": 0.2, "learning_rate": 1.8601365609632315e-05, "loss": 0.5024, "step": 1709 }, { "epoch": 0.2, "learning_rate": 1.859947694127956e-05, "loss": 0.4774, "step": 1710 }, { "epoch": 0.2, "learning_rate": 1.859758709460648e-05, "loss": 0.4771, "step": 1711 }, { "epoch": 0.2, "learning_rate": 1.8595696069872013e-05, "loss": 0.4811, "step": 1712 }, { "epoch": 0.2, "learning_rate": 1.8593803867335276e-05, "loss": 0.476, "step": 1713 }, { "epoch": 0.2, "learning_rate": 1.859191048725554e-05, "loss": 0.4997, "step": 1714 }, { "epoch": 0.2, "learning_rate": 1.8590015929892245e-05, "loss": 0.4814, "step": 1715 }, { "epoch": 0.2, "learning_rate": 1.858812019550499e-05, "loss": 0.4644, "step": 1716 }, { "epoch": 0.2, "learning_rate": 1.8586223284353522e-05, "loss": 0.4897, "step": 1717 }, { "epoch": 0.2, "learning_rate": 1.8584325196697767e-05, "loss": 0.4907, "step": 1718 }, { "epoch": 0.2, "learning_rate": 1.8582425932797807e-05, "loss": 0.475, "step": 1719 }, { "epoch": 0.2, "learning_rate": 1.8580525492913884e-05, "loss": 0.4799, "step": 1720 }, { "epoch": 0.2, "learning_rate": 1.8578623877306394e-05, "loss": 0.4759, "step": 1721 }, { "epoch": 0.2, "learning_rate": 1.8576721086235908e-05, "loss": 0.509, "step": 1722 }, { "epoch": 0.2, "learning_rate": 1.8574817119963145e-05, "loss": 0.4782, "step": 1723 }, { "epoch": 0.2, "learning_rate": 1.8572911978748993e-05, "loss": 0.4763, "step": 1724 }, { "epoch": 0.2, "learning_rate": 1.8571005662854502e-05, "loss": 0.5017, "step": 1725 }, { "epoch": 0.2, "learning_rate": 1.8569098172540875e-05, "loss": 0.4736, "step": 1726 }, { "epoch": 0.2, "learning_rate": 1.856718950806949e-05, "loss": 0.4701, "step": 1727 }, { "epoch": 0.2, "learning_rate": 1.8565279669701862e-05, "loss": 0.4726, "step": 1728 }, { "epoch": 0.2, "learning_rate": 1.8563368657699693e-05, "loss": 0.4578, "step": 1729 }, { "epoch": 0.2, "learning_rate": 1.856145647232483e-05, "loss": 0.4809, "step": 1730 }, { "epoch": 0.2, "learning_rate": 1.8559543113839285e-05, "loss": 0.4705, "step": 1731 }, { "epoch": 0.2, "learning_rate": 1.8557628582505235e-05, "loss": 0.5124, "step": 1732 }, { "epoch": 0.2, "learning_rate": 1.8555712878585005e-05, "loss": 0.473, "step": 1733 }, { "epoch": 0.2, "learning_rate": 1.8553796002341098e-05, "loss": 0.4715, "step": 1734 }, { "epoch": 0.2, "learning_rate": 1.8551877954036165e-05, "loss": 0.4905, "step": 1735 }, { "epoch": 0.2, "learning_rate": 1.854995873393302e-05, "loss": 0.4924, "step": 1736 }, { "epoch": 0.2, "learning_rate": 1.854803834229464e-05, "loss": 0.4684, "step": 1737 }, { "epoch": 0.2, "learning_rate": 1.8546116779384165e-05, "loss": 0.4869, "step": 1738 }, { "epoch": 0.2, "learning_rate": 1.8544194045464888e-05, "loss": 0.47, "step": 1739 }, { "epoch": 0.2, "learning_rate": 1.8542270140800266e-05, "loss": 0.4872, "step": 1740 }, { "epoch": 0.2, "learning_rate": 1.854034506565392e-05, "loss": 0.4664, "step": 1741 }, { "epoch": 0.2, "learning_rate": 1.8538418820289628e-05, "loss": 0.4862, "step": 1742 }, { "epoch": 0.2, "learning_rate": 1.8536491404971327e-05, "loss": 0.466, "step": 1743 }, { "epoch": 0.2, "learning_rate": 1.8534562819963112e-05, "loss": 0.4869, "step": 1744 }, { "epoch": 0.2, "learning_rate": 1.853263306552925e-05, "loss": 0.477, "step": 1745 }, { "epoch": 0.2, "learning_rate": 1.8530702141934157e-05, "loss": 0.4889, "step": 1746 }, { "epoch": 0.2, "learning_rate": 1.8528770049442413e-05, "loss": 0.4812, "step": 1747 }, { "epoch": 0.2, "learning_rate": 1.852683678831876e-05, "loss": 0.5022, "step": 1748 }, { "epoch": 0.2, "learning_rate": 1.852490235882809e-05, "loss": 0.477, "step": 1749 }, { "epoch": 0.2, "learning_rate": 1.852296676123547e-05, "loss": 0.4985, "step": 1750 }, { "epoch": 0.2, "learning_rate": 1.8521029995806123e-05, "loss": 0.489, "step": 1751 }, { "epoch": 0.2, "learning_rate": 1.851909206280542e-05, "loss": 0.4941, "step": 1752 }, { "epoch": 0.2, "learning_rate": 1.8517152962498908e-05, "loss": 0.4833, "step": 1753 }, { "epoch": 0.2, "learning_rate": 1.8515212695152284e-05, "loss": 0.4874, "step": 1754 }, { "epoch": 0.2, "learning_rate": 1.8513271261031406e-05, "loss": 0.4818, "step": 1755 }, { "epoch": 0.2, "learning_rate": 1.8511328660402302e-05, "loss": 0.4875, "step": 1756 }, { "epoch": 0.2, "learning_rate": 1.850938489353114e-05, "loss": 0.4796, "step": 1757 }, { "epoch": 0.2, "learning_rate": 1.850743996068427e-05, "loss": 0.4783, "step": 1758 }, { "epoch": 0.2, "learning_rate": 1.8505493862128187e-05, "loss": 0.4777, "step": 1759 }, { "epoch": 0.2, "learning_rate": 1.8503546598129547e-05, "loss": 0.478, "step": 1760 }, { "epoch": 0.2, "learning_rate": 1.8501598168955172e-05, "loss": 0.4774, "step": 1761 }, { "epoch": 0.2, "learning_rate": 1.8499648574872042e-05, "loss": 0.4938, "step": 1762 }, { "epoch": 0.2, "learning_rate": 1.849769781614729e-05, "loss": 0.4838, "step": 1763 }, { "epoch": 0.2, "learning_rate": 1.849574589304822e-05, "loss": 0.4955, "step": 1764 }, { "epoch": 0.2, "learning_rate": 1.8493792805842278e-05, "loss": 0.4886, "step": 1765 }, { "epoch": 0.2, "learning_rate": 1.8491838554797096e-05, "loss": 0.4945, "step": 1766 }, { "epoch": 0.2, "learning_rate": 1.8489883140180437e-05, "loss": 0.4612, "step": 1767 }, { "epoch": 0.2, "learning_rate": 1.848792656226024e-05, "loss": 0.492, "step": 1768 }, { "epoch": 0.2, "learning_rate": 1.8485968821304604e-05, "loss": 0.4717, "step": 1769 }, { "epoch": 0.2, "learning_rate": 1.848400991758178e-05, "loss": 0.4814, "step": 1770 }, { "epoch": 0.2, "learning_rate": 1.8482049851360182e-05, "loss": 0.48, "step": 1771 }, { "epoch": 0.2, "learning_rate": 1.8480088622908382e-05, "loss": 0.4792, "step": 1772 }, { "epoch": 0.2, "learning_rate": 1.8478126232495114e-05, "loss": 0.4839, "step": 1773 }, { "epoch": 0.2, "learning_rate": 1.8476162680389268e-05, "loss": 0.4825, "step": 1774 }, { "epoch": 0.2, "learning_rate": 1.847419796685989e-05, "loss": 0.4821, "step": 1775 }, { "epoch": 0.2, "learning_rate": 1.84722320921762e-05, "loss": 0.5115, "step": 1776 }, { "epoch": 0.2, "learning_rate": 1.8470265056607557e-05, "loss": 0.46, "step": 1777 }, { "epoch": 0.2, "learning_rate": 1.8468296860423494e-05, "loss": 0.4905, "step": 1778 }, { "epoch": 0.2, "learning_rate": 1.8466327503893697e-05, "loss": 0.4867, "step": 1779 }, { "epoch": 0.2, "learning_rate": 1.8464356987288012e-05, "loss": 0.4755, "step": 1780 }, { "epoch": 0.2, "learning_rate": 1.8462385310876444e-05, "loss": 0.4933, "step": 1781 }, { "epoch": 0.2, "learning_rate": 1.8460412474929154e-05, "loss": 0.4886, "step": 1782 }, { "epoch": 0.2, "learning_rate": 1.8458438479716466e-05, "loss": 0.4768, "step": 1783 }, { "epoch": 0.2, "learning_rate": 1.845646332550886e-05, "loss": 0.4779, "step": 1784 }, { "epoch": 0.2, "learning_rate": 1.845448701257698e-05, "loss": 0.4866, "step": 1785 }, { "epoch": 0.2, "learning_rate": 1.8452509541191625e-05, "loss": 0.4603, "step": 1786 }, { "epoch": 0.2, "learning_rate": 1.8450530911623747e-05, "loss": 0.5003, "step": 1787 }, { "epoch": 0.2, "learning_rate": 1.8448551124144467e-05, "loss": 0.4798, "step": 1788 }, { "epoch": 0.2, "learning_rate": 1.844657017902506e-05, "loss": 0.4767, "step": 1789 }, { "epoch": 0.2, "learning_rate": 1.844458807653696e-05, "loss": 0.4962, "step": 1790 }, { "epoch": 0.2, "learning_rate": 1.8442604816951757e-05, "loss": 0.4689, "step": 1791 }, { "epoch": 0.2, "learning_rate": 1.8440620400541202e-05, "loss": 0.5121, "step": 1792 }, { "epoch": 0.2, "learning_rate": 1.843863482757721e-05, "loss": 0.4729, "step": 1793 }, { "epoch": 0.21, "learning_rate": 1.8436648098331838e-05, "loss": 0.4883, "step": 1794 }, { "epoch": 0.21, "learning_rate": 1.843466021307732e-05, "loss": 0.4687, "step": 1795 }, { "epoch": 0.21, "learning_rate": 1.8432671172086044e-05, "loss": 0.4604, "step": 1796 }, { "epoch": 0.21, "learning_rate": 1.8430680975630545e-05, "loss": 0.4798, "step": 1797 }, { "epoch": 0.21, "learning_rate": 1.8428689623983526e-05, "loss": 0.468, "step": 1798 }, { "epoch": 0.21, "learning_rate": 1.8426697117417848e-05, "loss": 0.4735, "step": 1799 }, { "epoch": 0.21, "learning_rate": 1.8424703456206533e-05, "loss": 0.4889, "step": 1800 }, { "epoch": 0.21, "learning_rate": 1.842270864062275e-05, "loss": 0.4724, "step": 1801 }, { "epoch": 0.21, "learning_rate": 1.8420712670939837e-05, "loss": 0.4837, "step": 1802 }, { "epoch": 0.21, "learning_rate": 1.8418715547431283e-05, "loss": 0.4789, "step": 1803 }, { "epoch": 0.21, "learning_rate": 1.8416717270370744e-05, "loss": 0.4703, "step": 1804 }, { "epoch": 0.21, "learning_rate": 1.841471784003203e-05, "loss": 0.4746, "step": 1805 }, { "epoch": 0.21, "learning_rate": 1.84127172566891e-05, "loss": 0.4867, "step": 1806 }, { "epoch": 0.21, "learning_rate": 1.841071552061608e-05, "loss": 0.4663, "step": 1807 }, { "epoch": 0.21, "learning_rate": 1.8408712632087256e-05, "loss": 0.5056, "step": 1808 }, { "epoch": 0.21, "learning_rate": 1.840670859137707e-05, "loss": 0.4712, "step": 1809 }, { "epoch": 0.21, "learning_rate": 1.840470339876011e-05, "loss": 0.4915, "step": 1810 }, { "epoch": 0.21, "learning_rate": 1.8402697054511145e-05, "loss": 0.4752, "step": 1811 }, { "epoch": 0.21, "learning_rate": 1.8400689558905083e-05, "loss": 0.4876, "step": 1812 }, { "epoch": 0.21, "learning_rate": 1.8398680912216997e-05, "loss": 0.4676, "step": 1813 }, { "epoch": 0.21, "learning_rate": 1.8396671114722112e-05, "loss": 0.497, "step": 1814 }, { "epoch": 0.21, "learning_rate": 1.8394660166695822e-05, "loss": 0.4645, "step": 1815 }, { "epoch": 0.21, "learning_rate": 1.8392648068413667e-05, "loss": 0.5071, "step": 1816 }, { "epoch": 0.21, "learning_rate": 1.8390634820151353e-05, "loss": 0.4908, "step": 1817 }, { "epoch": 0.21, "learning_rate": 1.8388620422184738e-05, "loss": 0.4663, "step": 1818 }, { "epoch": 0.21, "learning_rate": 1.8386604874789836e-05, "loss": 0.4705, "step": 1819 }, { "epoch": 0.21, "learning_rate": 1.8384588178242828e-05, "loss": 0.4809, "step": 1820 }, { "epoch": 0.21, "learning_rate": 1.8382570332820045e-05, "loss": 0.5041, "step": 1821 }, { "epoch": 0.21, "learning_rate": 1.8380551338797974e-05, "loss": 0.472, "step": 1822 }, { "epoch": 0.21, "learning_rate": 1.8378531196453265e-05, "loss": 0.4672, "step": 1823 }, { "epoch": 0.21, "learning_rate": 1.837650990606272e-05, "loss": 0.498, "step": 1824 }, { "epoch": 0.21, "learning_rate": 1.8374487467903303e-05, "loss": 0.4822, "step": 1825 }, { "epoch": 0.21, "learning_rate": 1.8372463882252133e-05, "loss": 0.5021, "step": 1826 }, { "epoch": 0.21, "learning_rate": 1.8370439149386484e-05, "loss": 0.4562, "step": 1827 }, { "epoch": 0.21, "learning_rate": 1.8368413269583795e-05, "loss": 0.4936, "step": 1828 }, { "epoch": 0.21, "learning_rate": 1.8366386243121654e-05, "loss": 0.4606, "step": 1829 }, { "epoch": 0.21, "learning_rate": 1.8364358070277807e-05, "loss": 0.4959, "step": 1830 }, { "epoch": 0.21, "learning_rate": 1.836232875133016e-05, "loss": 0.4866, "step": 1831 }, { "epoch": 0.21, "learning_rate": 1.8360298286556774e-05, "loss": 0.4869, "step": 1832 }, { "epoch": 0.21, "learning_rate": 1.8358266676235872e-05, "loss": 0.4695, "step": 1833 }, { "epoch": 0.21, "learning_rate": 1.8356233920645822e-05, "loss": 0.5119, "step": 1834 }, { "epoch": 0.21, "learning_rate": 1.8354200020065168e-05, "loss": 0.4823, "step": 1835 }, { "epoch": 0.21, "learning_rate": 1.8352164974772592e-05, "loss": 0.4872, "step": 1836 }, { "epoch": 0.21, "learning_rate": 1.8350128785046943e-05, "loss": 0.4604, "step": 1837 }, { "epoch": 0.21, "learning_rate": 1.8348091451167224e-05, "loss": 0.4571, "step": 1838 }, { "epoch": 0.21, "learning_rate": 1.8346052973412593e-05, "loss": 0.5112, "step": 1839 }, { "epoch": 0.21, "learning_rate": 1.834401335206237e-05, "loss": 0.4873, "step": 1840 }, { "epoch": 0.21, "learning_rate": 1.8341972587396032e-05, "loss": 0.4778, "step": 1841 }, { "epoch": 0.21, "learning_rate": 1.8339930679693202e-05, "loss": 0.475, "step": 1842 }, { "epoch": 0.21, "learning_rate": 1.8337887629233672e-05, "loss": 0.4649, "step": 1843 }, { "epoch": 0.21, "learning_rate": 1.833584343629738e-05, "loss": 0.5096, "step": 1844 }, { "epoch": 0.21, "learning_rate": 1.8333798101164433e-05, "loss": 0.4945, "step": 1845 }, { "epoch": 0.21, "learning_rate": 1.833175162411508e-05, "loss": 0.4645, "step": 1846 }, { "epoch": 0.21, "learning_rate": 1.8329704005429745e-05, "loss": 0.4822, "step": 1847 }, { "epoch": 0.21, "learning_rate": 1.8327655245388986e-05, "loss": 0.4826, "step": 1848 }, { "epoch": 0.21, "learning_rate": 1.8325605344273536e-05, "loss": 0.4994, "step": 1849 }, { "epoch": 0.21, "learning_rate": 1.8323554302364273e-05, "loss": 0.4873, "step": 1850 }, { "epoch": 0.21, "learning_rate": 1.832150211994224e-05, "loss": 0.4714, "step": 1851 }, { "epoch": 0.21, "learning_rate": 1.8319448797288628e-05, "loss": 0.4985, "step": 1852 }, { "epoch": 0.21, "learning_rate": 1.831739433468479e-05, "loss": 0.4863, "step": 1853 }, { "epoch": 0.21, "learning_rate": 1.831533873241223e-05, "loss": 0.4833, "step": 1854 }, { "epoch": 0.21, "learning_rate": 1.831328199075262e-05, "loss": 0.4667, "step": 1855 }, { "epoch": 0.21, "learning_rate": 1.8311224109987768e-05, "loss": 0.476, "step": 1856 }, { "epoch": 0.21, "learning_rate": 1.8309165090399657e-05, "loss": 0.516, "step": 1857 }, { "epoch": 0.21, "learning_rate": 1.8307104932270415e-05, "loss": 0.4699, "step": 1858 }, { "epoch": 0.21, "learning_rate": 1.8305043635882334e-05, "loss": 0.4787, "step": 1859 }, { "epoch": 0.21, "learning_rate": 1.830298120151785e-05, "loss": 0.4944, "step": 1860 }, { "epoch": 0.21, "learning_rate": 1.8300917629459575e-05, "loss": 0.494, "step": 1861 }, { "epoch": 0.21, "learning_rate": 1.8298852919990254e-05, "loss": 0.4809, "step": 1862 }, { "epoch": 0.21, "learning_rate": 1.82967870733928e-05, "loss": 0.4735, "step": 1863 }, { "epoch": 0.21, "learning_rate": 1.8294720089950282e-05, "loss": 0.4649, "step": 1864 }, { "epoch": 0.21, "learning_rate": 1.8292651969945923e-05, "loss": 0.491, "step": 1865 }, { "epoch": 0.21, "learning_rate": 1.82905827136631e-05, "loss": 0.4947, "step": 1866 }, { "epoch": 0.21, "learning_rate": 1.828851232138535e-05, "loss": 0.4686, "step": 1867 }, { "epoch": 0.21, "learning_rate": 1.828644079339636e-05, "loss": 0.4651, "step": 1868 }, { "epoch": 0.21, "learning_rate": 1.828436812997998e-05, "loss": 0.4662, "step": 1869 }, { "epoch": 0.21, "learning_rate": 1.8282294331420204e-05, "loss": 0.4872, "step": 1870 }, { "epoch": 0.21, "learning_rate": 1.8280219398001192e-05, "loss": 0.4907, "step": 1871 }, { "epoch": 0.21, "learning_rate": 1.827814333000726e-05, "loss": 0.4671, "step": 1872 }, { "epoch": 0.21, "learning_rate": 1.827606612772287e-05, "loss": 0.474, "step": 1873 }, { "epoch": 0.21, "learning_rate": 1.827398779143265e-05, "loss": 0.4831, "step": 1874 }, { "epoch": 0.21, "learning_rate": 1.8271908321421376e-05, "loss": 0.4973, "step": 1875 }, { "epoch": 0.21, "learning_rate": 1.8269827717973982e-05, "loss": 0.4786, "step": 1876 }, { "epoch": 0.21, "learning_rate": 1.8267745981375555e-05, "loss": 0.4745, "step": 1877 }, { "epoch": 0.21, "learning_rate": 1.8265663111911344e-05, "loss": 0.5025, "step": 1878 }, { "epoch": 0.21, "learning_rate": 1.8263579109866745e-05, "loss": 0.4768, "step": 1879 }, { "epoch": 0.21, "learning_rate": 1.8261493975527312e-05, "loss": 0.4807, "step": 1880 }, { "epoch": 0.21, "learning_rate": 1.8259407709178758e-05, "loss": 0.4922, "step": 1881 }, { "epoch": 0.22, "learning_rate": 1.8257320311106948e-05, "loss": 0.4806, "step": 1882 }, { "epoch": 0.22, "learning_rate": 1.82552317815979e-05, "loss": 0.491, "step": 1883 }, { "epoch": 0.22, "learning_rate": 1.825314212093779e-05, "loss": 0.4727, "step": 1884 }, { "epoch": 0.22, "learning_rate": 1.825105132941295e-05, "loss": 0.4835, "step": 1885 }, { "epoch": 0.22, "learning_rate": 1.8248959407309862e-05, "loss": 0.4773, "step": 1886 }, { "epoch": 0.22, "learning_rate": 1.824686635491517e-05, "loss": 0.4654, "step": 1887 }, { "epoch": 0.22, "learning_rate": 1.824477217251566e-05, "loss": 0.4921, "step": 1888 }, { "epoch": 0.22, "learning_rate": 1.8242676860398295e-05, "loss": 0.5063, "step": 1889 }, { "epoch": 0.22, "learning_rate": 1.824058041885017e-05, "loss": 0.4779, "step": 1890 }, { "epoch": 0.22, "learning_rate": 1.8238482848158548e-05, "loss": 0.4864, "step": 1891 }, { "epoch": 0.22, "learning_rate": 1.8236384148610843e-05, "loss": 0.4714, "step": 1892 }, { "epoch": 0.22, "learning_rate": 1.823428432049462e-05, "loss": 0.4911, "step": 1893 }, { "epoch": 0.22, "learning_rate": 1.8232183364097605e-05, "loss": 0.4711, "step": 1894 }, { "epoch": 0.22, "learning_rate": 1.8230081279707675e-05, "loss": 0.4749, "step": 1895 }, { "epoch": 0.22, "learning_rate": 1.822797806761287e-05, "loss": 0.4695, "step": 1896 }, { "epoch": 0.22, "learning_rate": 1.8225873728101367e-05, "loss": 0.4946, "step": 1897 }, { "epoch": 0.22, "learning_rate": 1.822376826146151e-05, "loss": 0.4869, "step": 1898 }, { "epoch": 0.22, "learning_rate": 1.8221661667981795e-05, "loss": 0.4795, "step": 1899 }, { "epoch": 0.22, "learning_rate": 1.8219553947950874e-05, "loss": 0.4721, "step": 1900 }, { "epoch": 0.22, "learning_rate": 1.8217445101657553e-05, "loss": 0.4663, "step": 1901 }, { "epoch": 0.22, "learning_rate": 1.8215335129390785e-05, "loss": 0.4833, "step": 1902 }, { "epoch": 0.22, "learning_rate": 1.821322403143969e-05, "loss": 0.481, "step": 1903 }, { "epoch": 0.22, "learning_rate": 1.8211111808093534e-05, "loss": 0.473, "step": 1904 }, { "epoch": 0.22, "learning_rate": 1.8208998459641737e-05, "loss": 0.4881, "step": 1905 }, { "epoch": 0.22, "learning_rate": 1.8206883986373872e-05, "loss": 0.4802, "step": 1906 }, { "epoch": 0.22, "learning_rate": 1.820476838857968e-05, "loss": 0.4852, "step": 1907 }, { "epoch": 0.22, "learning_rate": 1.820265166654903e-05, "loss": 0.4831, "step": 1908 }, { "epoch": 0.22, "learning_rate": 1.8200533820571973e-05, "loss": 0.497, "step": 1909 }, { "epoch": 0.22, "learning_rate": 1.8198414850938694e-05, "loss": 0.4615, "step": 1910 }, { "epoch": 0.22, "learning_rate": 1.8196294757939543e-05, "loss": 0.4956, "step": 1911 }, { "epoch": 0.22, "learning_rate": 1.8194173541865014e-05, "loss": 0.4716, "step": 1912 }, { "epoch": 0.22, "learning_rate": 1.8192051203005768e-05, "loss": 0.4638, "step": 1913 }, { "epoch": 0.22, "learning_rate": 1.818992774165261e-05, "loss": 0.4879, "step": 1914 }, { "epoch": 0.22, "learning_rate": 1.81878031580965e-05, "loss": 0.4875, "step": 1915 }, { "epoch": 0.22, "learning_rate": 1.8185677452628557e-05, "loss": 0.4882, "step": 1916 }, { "epoch": 0.22, "learning_rate": 1.818355062554005e-05, "loss": 0.4997, "step": 1917 }, { "epoch": 0.22, "learning_rate": 1.81814226771224e-05, "loss": 0.4726, "step": 1918 }, { "epoch": 0.22, "learning_rate": 1.8179293607667177e-05, "loss": 0.4946, "step": 1919 }, { "epoch": 0.22, "learning_rate": 1.8177163417466122e-05, "loss": 0.4876, "step": 1920 }, { "epoch": 0.22, "learning_rate": 1.8175032106811114e-05, "loss": 0.4709, "step": 1921 }, { "epoch": 0.22, "learning_rate": 1.817289967599419e-05, "loss": 0.4999, "step": 1922 }, { "epoch": 0.22, "learning_rate": 1.8170766125307543e-05, "loss": 0.4864, "step": 1923 }, { "epoch": 0.22, "learning_rate": 1.816863145504351e-05, "loss": 0.4812, "step": 1924 }, { "epoch": 0.22, "learning_rate": 1.81664956654946e-05, "loss": 0.4748, "step": 1925 }, { "epoch": 0.22, "learning_rate": 1.816435875695345e-05, "loss": 0.4671, "step": 1926 }, { "epoch": 0.22, "learning_rate": 1.8162220729712875e-05, "loss": 0.4808, "step": 1927 }, { "epoch": 0.22, "learning_rate": 1.8160081584065833e-05, "loss": 0.4736, "step": 1928 }, { "epoch": 0.22, "learning_rate": 1.8157941320305424e-05, "loss": 0.4868, "step": 1929 }, { "epoch": 0.22, "learning_rate": 1.815579993872492e-05, "loss": 0.4725, "step": 1930 }, { "epoch": 0.22, "learning_rate": 1.8153657439617738e-05, "loss": 0.491, "step": 1931 }, { "epoch": 0.22, "learning_rate": 1.8151513823277447e-05, "loss": 0.4761, "step": 1932 }, { "epoch": 0.22, "learning_rate": 1.8149369089997767e-05, "loss": 0.5125, "step": 1933 }, { "epoch": 0.22, "learning_rate": 1.814722324007258e-05, "loss": 0.4676, "step": 1934 }, { "epoch": 0.22, "learning_rate": 1.8145076273795914e-05, "loss": 0.4984, "step": 1935 }, { "epoch": 0.22, "learning_rate": 1.814292819146195e-05, "loss": 0.47, "step": 1936 }, { "epoch": 0.22, "learning_rate": 1.814077899336502e-05, "loss": 0.4997, "step": 1937 }, { "epoch": 0.22, "learning_rate": 1.813862867979962e-05, "loss": 0.4623, "step": 1938 }, { "epoch": 0.22, "learning_rate": 1.8136477251060385e-05, "loss": 0.463, "step": 1939 }, { "epoch": 0.22, "learning_rate": 1.813432470744211e-05, "loss": 0.4888, "step": 1940 }, { "epoch": 0.22, "learning_rate": 1.813217104923974e-05, "loss": 0.4848, "step": 1941 }, { "epoch": 0.22, "learning_rate": 1.813001627674838e-05, "loss": 0.5043, "step": 1942 }, { "epoch": 0.22, "learning_rate": 1.8127860390263275e-05, "loss": 0.4762, "step": 1943 }, { "epoch": 0.22, "learning_rate": 1.812570339007983e-05, "loss": 0.4681, "step": 1944 }, { "epoch": 0.22, "learning_rate": 1.8123545276493607e-05, "loss": 0.4824, "step": 1945 }, { "epoch": 0.22, "learning_rate": 1.8121386049800317e-05, "loss": 0.4819, "step": 1946 }, { "epoch": 0.22, "learning_rate": 1.8119225710295815e-05, "loss": 0.4734, "step": 1947 }, { "epoch": 0.22, "learning_rate": 1.811706425827612e-05, "loss": 0.4641, "step": 1948 }, { "epoch": 0.22, "learning_rate": 1.8114901694037402e-05, "loss": 0.4786, "step": 1949 }, { "epoch": 0.22, "learning_rate": 1.8112738017875974e-05, "loss": 0.484, "step": 1950 }, { "epoch": 0.22, "learning_rate": 1.811057323008831e-05, "loss": 0.5028, "step": 1951 }, { "epoch": 0.22, "learning_rate": 1.810840733097104e-05, "loss": 0.481, "step": 1952 }, { "epoch": 0.22, "learning_rate": 1.8106240320820928e-05, "loss": 0.4853, "step": 1953 }, { "epoch": 0.22, "learning_rate": 1.8104072199934916e-05, "loss": 0.468, "step": 1954 }, { "epoch": 0.22, "learning_rate": 1.8101902968610082e-05, "loss": 0.4989, "step": 1955 }, { "epoch": 0.22, "learning_rate": 1.8099732627143655e-05, "loss": 0.4905, "step": 1956 }, { "epoch": 0.22, "learning_rate": 1.809756117583302e-05, "loss": 0.464, "step": 1957 }, { "epoch": 0.22, "learning_rate": 1.809538861497572e-05, "loss": 0.4789, "step": 1958 }, { "epoch": 0.22, "learning_rate": 1.8093214944869437e-05, "loss": 0.4867, "step": 1959 }, { "epoch": 0.22, "learning_rate": 1.8091040165812018e-05, "loss": 0.4939, "step": 1960 }, { "epoch": 0.22, "learning_rate": 1.8088864278101452e-05, "loss": 0.4874, "step": 1961 }, { "epoch": 0.22, "learning_rate": 1.808668728203589e-05, "loss": 0.4741, "step": 1962 }, { "epoch": 0.22, "learning_rate": 1.8084509177913623e-05, "loss": 0.4968, "step": 1963 }, { "epoch": 0.22, "learning_rate": 1.8082329966033105e-05, "loss": 0.4904, "step": 1964 }, { "epoch": 0.22, "learning_rate": 1.8080149646692932e-05, "loss": 0.4782, "step": 1965 }, { "epoch": 0.22, "learning_rate": 1.807796822019186e-05, "loss": 0.4839, "step": 1966 }, { "epoch": 0.22, "learning_rate": 1.807578568682879e-05, "loss": 0.4976, "step": 1967 }, { "epoch": 0.22, "learning_rate": 1.8073602046902784e-05, "loss": 0.4823, "step": 1968 }, { "epoch": 0.23, "learning_rate": 1.8071417300713038e-05, "loss": 0.4928, "step": 1969 }, { "epoch": 0.23, "learning_rate": 1.8069231448558923e-05, "loss": 0.4787, "step": 1970 }, { "epoch": 0.23, "learning_rate": 1.806704449073994e-05, "loss": 0.4659, "step": 1971 }, { "epoch": 0.23, "learning_rate": 1.806485642755576e-05, "loss": 0.477, "step": 1972 }, { "epoch": 0.23, "learning_rate": 1.8062667259306193e-05, "loss": 0.4825, "step": 1973 }, { "epoch": 0.23, "learning_rate": 1.80604769862912e-05, "loss": 0.4756, "step": 1974 }, { "epoch": 0.23, "learning_rate": 1.8058285608810903e-05, "loss": 0.4778, "step": 1975 }, { "epoch": 0.23, "learning_rate": 1.8056093127165564e-05, "loss": 0.5072, "step": 1976 }, { "epoch": 0.23, "learning_rate": 1.8053899541655605e-05, "loss": 0.4728, "step": 1977 }, { "epoch": 0.23, "learning_rate": 1.8051704852581595e-05, "loss": 0.4835, "step": 1978 }, { "epoch": 0.23, "learning_rate": 1.804950906024426e-05, "loss": 0.4829, "step": 1979 }, { "epoch": 0.23, "learning_rate": 1.804731216494447e-05, "loss": 0.4627, "step": 1980 }, { "epoch": 0.23, "learning_rate": 1.804511416698324e-05, "loss": 0.4922, "step": 1981 }, { "epoch": 0.23, "learning_rate": 1.804291506666176e-05, "loss": 0.4687, "step": 1982 }, { "epoch": 0.23, "learning_rate": 1.8040714864281347e-05, "loss": 0.5074, "step": 1983 }, { "epoch": 0.23, "learning_rate": 1.8038513560143477e-05, "loss": 0.479, "step": 1984 }, { "epoch": 0.23, "learning_rate": 1.8036311154549783e-05, "loss": 0.4841, "step": 1985 }, { "epoch": 0.23, "learning_rate": 1.803410764780204e-05, "loss": 0.4791, "step": 1986 }, { "epoch": 0.23, "learning_rate": 1.803190304020218e-05, "loss": 0.5005, "step": 1987 }, { "epoch": 0.23, "learning_rate": 1.8029697332052277e-05, "loss": 0.4771, "step": 1988 }, { "epoch": 0.23, "learning_rate": 1.8027490523654568e-05, "loss": 0.4959, "step": 1989 }, { "epoch": 0.23, "learning_rate": 1.8025282615311437e-05, "loss": 0.4576, "step": 1990 }, { "epoch": 0.23, "learning_rate": 1.802307360732541e-05, "loss": 0.4692, "step": 1991 }, { "epoch": 0.23, "learning_rate": 1.8020863499999182e-05, "loss": 0.4766, "step": 1992 }, { "epoch": 0.23, "learning_rate": 1.801865229363557e-05, "loss": 0.4822, "step": 1993 }, { "epoch": 0.23, "learning_rate": 1.8016439988537576e-05, "loss": 0.4648, "step": 1994 }, { "epoch": 0.23, "learning_rate": 1.8014226585008322e-05, "loss": 0.505, "step": 1995 }, { "epoch": 0.23, "learning_rate": 1.80120120833511e-05, "loss": 0.4659, "step": 1996 }, { "epoch": 0.23, "learning_rate": 1.8009796483869347e-05, "loss": 0.485, "step": 1997 }, { "epoch": 0.23, "learning_rate": 1.8007579786866648e-05, "loss": 0.4654, "step": 1998 }, { "epoch": 0.23, "learning_rate": 1.8005361992646736e-05, "loss": 0.4911, "step": 1999 }, { "epoch": 0.23, "learning_rate": 1.8003143101513502e-05, "loss": 0.5044, "step": 2000 }, { "epoch": 0.23, "learning_rate": 1.8000923113770987e-05, "loss": 0.4838, "step": 2001 }, { "epoch": 0.23, "learning_rate": 1.7998702029723372e-05, "loss": 0.454, "step": 2002 }, { "epoch": 0.23, "learning_rate": 1.7996479849675e-05, "loss": 0.4945, "step": 2003 }, { "epoch": 0.23, "learning_rate": 1.799425657393036e-05, "loss": 0.4773, "step": 2004 }, { "epoch": 0.23, "learning_rate": 1.7992032202794084e-05, "loss": 0.4931, "step": 2005 }, { "epoch": 0.23, "learning_rate": 1.798980673657097e-05, "loss": 0.4624, "step": 2006 }, { "epoch": 0.23, "learning_rate": 1.7987580175565948e-05, "loss": 0.481, "step": 2007 }, { "epoch": 0.23, "learning_rate": 1.798535252008411e-05, "loss": 0.4772, "step": 2008 }, { "epoch": 0.23, "learning_rate": 1.7983123770430696e-05, "loss": 0.4951, "step": 2009 }, { "epoch": 0.23, "learning_rate": 1.7980893926911092e-05, "loss": 0.4809, "step": 2010 }, { "epoch": 0.23, "learning_rate": 1.7978662989830834e-05, "loss": 0.4861, "step": 2011 }, { "epoch": 0.23, "learning_rate": 1.7976430959495617e-05, "loss": 0.4623, "step": 2012 }, { "epoch": 0.23, "learning_rate": 1.7974197836211275e-05, "loss": 0.4759, "step": 2013 }, { "epoch": 0.23, "learning_rate": 1.7971963620283795e-05, "loss": 0.4842, "step": 2014 }, { "epoch": 0.23, "learning_rate": 1.7969728312019316e-05, "loss": 0.4847, "step": 2015 }, { "epoch": 0.23, "learning_rate": 1.7967491911724125e-05, "loss": 0.484, "step": 2016 }, { "epoch": 0.23, "learning_rate": 1.796525441970466e-05, "loss": 0.4841, "step": 2017 }, { "epoch": 0.23, "learning_rate": 1.7963015836267502e-05, "loss": 0.4862, "step": 2018 }, { "epoch": 0.23, "learning_rate": 1.7960776161719396e-05, "loss": 0.4713, "step": 2019 }, { "epoch": 0.23, "learning_rate": 1.7958535396367218e-05, "loss": 0.4855, "step": 2020 }, { "epoch": 0.23, "learning_rate": 1.795629354051801e-05, "loss": 0.4947, "step": 2021 }, { "epoch": 0.23, "learning_rate": 1.7954050594478952e-05, "loss": 0.4709, "step": 2022 }, { "epoch": 0.23, "learning_rate": 1.795180655855738e-05, "loss": 0.4753, "step": 2023 }, { "epoch": 0.23, "learning_rate": 1.7949561433060775e-05, "loss": 0.4592, "step": 2024 }, { "epoch": 0.23, "learning_rate": 1.794731521829677e-05, "loss": 0.479, "step": 2025 }, { "epoch": 0.23, "learning_rate": 1.7945067914573147e-05, "loss": 0.4769, "step": 2026 }, { "epoch": 0.23, "learning_rate": 1.7942819522197837e-05, "loss": 0.4883, "step": 2027 }, { "epoch": 0.23, "learning_rate": 1.794057004147892e-05, "loss": 0.4726, "step": 2028 }, { "epoch": 0.23, "learning_rate": 1.793831947272463e-05, "loss": 0.4931, "step": 2029 }, { "epoch": 0.23, "learning_rate": 1.793606781624333e-05, "loss": 0.4699, "step": 2030 }, { "epoch": 0.23, "learning_rate": 1.7933815072343565e-05, "loss": 0.4965, "step": 2031 }, { "epoch": 0.23, "learning_rate": 1.7931561241333998e-05, "loss": 0.4694, "step": 2032 }, { "epoch": 0.23, "learning_rate": 1.7929306323523463e-05, "loss": 0.4896, "step": 2033 }, { "epoch": 0.23, "learning_rate": 1.792705031922093e-05, "loss": 0.4737, "step": 2034 }, { "epoch": 0.23, "learning_rate": 1.792479322873552e-05, "loss": 0.4702, "step": 2035 }, { "epoch": 0.23, "learning_rate": 1.792253505237651e-05, "loss": 0.5163, "step": 2036 }, { "epoch": 0.23, "learning_rate": 1.7920275790453318e-05, "loss": 0.4697, "step": 2037 }, { "epoch": 0.23, "learning_rate": 1.7918015443275517e-05, "loss": 0.4757, "step": 2038 }, { "epoch": 0.23, "learning_rate": 1.7915754011152815e-05, "loss": 0.4824, "step": 2039 }, { "epoch": 0.23, "learning_rate": 1.791349149439509e-05, "loss": 0.4852, "step": 2040 }, { "epoch": 0.23, "learning_rate": 1.7911227893312347e-05, "loss": 0.4749, "step": 2041 }, { "epoch": 0.23, "learning_rate": 1.790896320821476e-05, "loss": 0.485, "step": 2042 }, { "epoch": 0.23, "learning_rate": 1.7906697439412634e-05, "loss": 0.4604, "step": 2043 }, { "epoch": 0.23, "learning_rate": 1.790443058721643e-05, "loss": 0.4646, "step": 2044 }, { "epoch": 0.23, "learning_rate": 1.7902162651936766e-05, "loss": 0.4981, "step": 2045 }, { "epoch": 0.23, "learning_rate": 1.789989363388439e-05, "loss": 0.4722, "step": 2046 }, { "epoch": 0.23, "learning_rate": 1.7897623533370212e-05, "loss": 0.4707, "step": 2047 }, { "epoch": 0.23, "learning_rate": 1.7895352350705288e-05, "loss": 0.4786, "step": 2048 }, { "epoch": 0.23, "learning_rate": 1.7893080086200817e-05, "loss": 0.4885, "step": 2049 }, { "epoch": 0.23, "learning_rate": 1.789080674016815e-05, "loss": 0.4913, "step": 2050 }, { "epoch": 0.23, "learning_rate": 1.7888532312918793e-05, "loss": 0.498, "step": 2051 }, { "epoch": 0.23, "learning_rate": 1.7886256804764385e-05, "loss": 0.4651, "step": 2052 }, { "epoch": 0.23, "learning_rate": 1.7883980216016724e-05, "loss": 0.4745, "step": 2053 }, { "epoch": 0.23, "learning_rate": 1.788170254698776e-05, "loss": 0.4867, "step": 2054 }, { "epoch": 0.23, "learning_rate": 1.7879423797989573e-05, "loss": 0.455, "step": 2055 }, { "epoch": 0.23, "learning_rate": 1.787714396933441e-05, "loss": 0.4727, "step": 2056 }, { "epoch": 0.24, "learning_rate": 1.7874863061334658e-05, "loss": 0.4833, "step": 2057 }, { "epoch": 0.24, "learning_rate": 1.7872581074302852e-05, "loss": 0.494, "step": 2058 }, { "epoch": 0.24, "learning_rate": 1.7870298008551674e-05, "loss": 0.4881, "step": 2059 }, { "epoch": 0.24, "learning_rate": 1.786801386439395e-05, "loss": 0.4843, "step": 2060 }, { "epoch": 0.24, "learning_rate": 1.7865728642142668e-05, "loss": 0.4787, "step": 2061 }, { "epoch": 0.24, "learning_rate": 1.786344234211095e-05, "loss": 0.4876, "step": 2062 }, { "epoch": 0.24, "learning_rate": 1.786115496461207e-05, "loss": 0.4639, "step": 2063 }, { "epoch": 0.24, "learning_rate": 1.7858866509959455e-05, "loss": 0.4657, "step": 2064 }, { "epoch": 0.24, "learning_rate": 1.7856576978466666e-05, "loss": 0.4768, "step": 2065 }, { "epoch": 0.24, "learning_rate": 1.785428637044742e-05, "loss": 0.4837, "step": 2066 }, { "epoch": 0.24, "learning_rate": 1.7851994686215592e-05, "loss": 0.498, "step": 2067 }, { "epoch": 0.24, "learning_rate": 1.7849701926085183e-05, "loss": 0.4789, "step": 2068 }, { "epoch": 0.24, "learning_rate": 1.7847408090370355e-05, "loss": 0.47, "step": 2069 }, { "epoch": 0.24, "learning_rate": 1.784511317938542e-05, "loss": 0.4868, "step": 2070 }, { "epoch": 0.24, "learning_rate": 1.7842817193444823e-05, "loss": 0.4803, "step": 2071 }, { "epoch": 0.24, "learning_rate": 1.7840520132863173e-05, "loss": 0.4863, "step": 2072 }, { "epoch": 0.24, "learning_rate": 1.783822199795522e-05, "loss": 0.4667, "step": 2073 }, { "epoch": 0.24, "learning_rate": 1.7835922789035853e-05, "loss": 0.4738, "step": 2074 }, { "epoch": 0.24, "learning_rate": 1.7833622506420116e-05, "loss": 0.454, "step": 2075 }, { "epoch": 0.24, "learning_rate": 1.7831321150423203e-05, "loss": 0.5017, "step": 2076 }, { "epoch": 0.24, "learning_rate": 1.782901872136045e-05, "loss": 0.4968, "step": 2077 }, { "epoch": 0.24, "learning_rate": 1.7826715219547336e-05, "loss": 0.4852, "step": 2078 }, { "epoch": 0.24, "learning_rate": 1.78244106452995e-05, "loss": 0.4827, "step": 2079 }, { "epoch": 0.24, "learning_rate": 1.7822104998932715e-05, "loss": 0.4838, "step": 2080 }, { "epoch": 0.24, "learning_rate": 1.7819798280762907e-05, "loss": 0.4729, "step": 2081 }, { "epoch": 0.24, "learning_rate": 1.7817490491106148e-05, "loss": 0.4647, "step": 2082 }, { "epoch": 0.24, "learning_rate": 1.7815181630278656e-05, "loss": 0.4783, "step": 2083 }, { "epoch": 0.24, "learning_rate": 1.78128716985968e-05, "loss": 0.4797, "step": 2084 }, { "epoch": 0.24, "learning_rate": 1.781056069637709e-05, "loss": 0.5009, "step": 2085 }, { "epoch": 0.24, "learning_rate": 1.7808248623936183e-05, "loss": 0.5092, "step": 2086 }, { "epoch": 0.24, "learning_rate": 1.780593548159089e-05, "loss": 0.4692, "step": 2087 }, { "epoch": 0.24, "learning_rate": 1.7803621269658154e-05, "loss": 0.4904, "step": 2088 }, { "epoch": 0.24, "learning_rate": 1.7801305988455085e-05, "loss": 0.4693, "step": 2089 }, { "epoch": 0.24, "learning_rate": 1.779898963829892e-05, "loss": 0.4656, "step": 2090 }, { "epoch": 0.24, "learning_rate": 1.779667221950705e-05, "loss": 0.4907, "step": 2091 }, { "epoch": 0.24, "learning_rate": 1.7794353732397018e-05, "loss": 0.47, "step": 2092 }, { "epoch": 0.24, "learning_rate": 1.7792034177286508e-05, "loss": 0.4755, "step": 2093 }, { "epoch": 0.24, "learning_rate": 1.778971355449335e-05, "loss": 0.4875, "step": 2094 }, { "epoch": 0.24, "learning_rate": 1.7787391864335517e-05, "loss": 0.4787, "step": 2095 }, { "epoch": 0.24, "learning_rate": 1.778506910713114e-05, "loss": 0.4721, "step": 2096 }, { "epoch": 0.24, "learning_rate": 1.778274528319848e-05, "loss": 0.4827, "step": 2097 }, { "epoch": 0.24, "learning_rate": 1.778042039285596e-05, "loss": 0.462, "step": 2098 }, { "epoch": 0.24, "learning_rate": 1.777809443642214e-05, "loss": 0.4773, "step": 2099 }, { "epoch": 0.24, "learning_rate": 1.7775767414215726e-05, "loss": 0.4847, "step": 2100 }, { "epoch": 0.24, "learning_rate": 1.7773439326555574e-05, "loss": 0.4716, "step": 2101 }, { "epoch": 0.24, "learning_rate": 1.777111017376068e-05, "loss": 0.4797, "step": 2102 }, { "epoch": 0.24, "learning_rate": 1.7768779956150196e-05, "loss": 0.4778, "step": 2103 }, { "epoch": 0.24, "learning_rate": 1.776644867404341e-05, "loss": 0.4625, "step": 2104 }, { "epoch": 0.24, "learning_rate": 1.776411632775976e-05, "loss": 0.46, "step": 2105 }, { "epoch": 0.24, "learning_rate": 1.7761782917618836e-05, "loss": 0.4934, "step": 2106 }, { "epoch": 0.24, "learning_rate": 1.7759448443940355e-05, "loss": 0.459, "step": 2107 }, { "epoch": 0.24, "learning_rate": 1.77571129070442e-05, "loss": 0.4785, "step": 2108 }, { "epoch": 0.24, "learning_rate": 1.775477630725039e-05, "loss": 0.4648, "step": 2109 }, { "epoch": 0.24, "learning_rate": 1.7752438644879092e-05, "loss": 0.5045, "step": 2110 }, { "epoch": 0.24, "learning_rate": 1.7750099920250616e-05, "loss": 0.4848, "step": 2111 }, { "epoch": 0.24, "learning_rate": 1.774776013368542e-05, "loss": 0.4724, "step": 2112 }, { "epoch": 0.24, "learning_rate": 1.774541928550411e-05, "loss": 0.4749, "step": 2113 }, { "epoch": 0.24, "learning_rate": 1.7743077376027433e-05, "loss": 0.4872, "step": 2114 }, { "epoch": 0.24, "learning_rate": 1.7740734405576283e-05, "loss": 0.4778, "step": 2115 }, { "epoch": 0.24, "learning_rate": 1.7738390374471696e-05, "loss": 0.4904, "step": 2116 }, { "epoch": 0.24, "learning_rate": 1.773604528303486e-05, "loss": 0.4892, "step": 2117 }, { "epoch": 0.24, "learning_rate": 1.7733699131587104e-05, "loss": 0.4918, "step": 2118 }, { "epoch": 0.24, "learning_rate": 1.77313519204499e-05, "loss": 0.4776, "step": 2119 }, { "epoch": 0.24, "learning_rate": 1.7729003649944878e-05, "loss": 0.4777, "step": 2120 }, { "epoch": 0.24, "learning_rate": 1.7726654320393795e-05, "loss": 0.4935, "step": 2121 }, { "epoch": 0.24, "learning_rate": 1.772430393211856e-05, "loss": 0.482, "step": 2122 }, { "epoch": 0.24, "learning_rate": 1.7721952485441232e-05, "loss": 0.4718, "step": 2123 }, { "epoch": 0.24, "learning_rate": 1.7719599980684016e-05, "loss": 0.4591, "step": 2124 }, { "epoch": 0.24, "learning_rate": 1.7717246418169252e-05, "loss": 0.481, "step": 2125 }, { "epoch": 0.24, "learning_rate": 1.7714891798219432e-05, "loss": 0.4851, "step": 2126 }, { "epoch": 0.24, "learning_rate": 1.771253612115719e-05, "loss": 0.5005, "step": 2127 }, { "epoch": 0.24, "learning_rate": 1.7710179387305308e-05, "loss": 0.4734, "step": 2128 }, { "epoch": 0.24, "learning_rate": 1.7707821596986715e-05, "loss": 0.4805, "step": 2129 }, { "epoch": 0.24, "learning_rate": 1.7705462750524474e-05, "loss": 0.4809, "step": 2130 }, { "epoch": 0.24, "learning_rate": 1.77031028482418e-05, "loss": 0.4728, "step": 2131 }, { "epoch": 0.24, "learning_rate": 1.770074189046206e-05, "loss": 0.4759, "step": 2132 }, { "epoch": 0.24, "learning_rate": 1.7698379877508755e-05, "loss": 0.4709, "step": 2133 }, { "epoch": 0.24, "learning_rate": 1.7696016809705525e-05, "loss": 0.4993, "step": 2134 }, { "epoch": 0.24, "learning_rate": 1.7693652687376173e-05, "loss": 0.4765, "step": 2135 }, { "epoch": 0.24, "learning_rate": 1.769128751084463e-05, "loss": 0.4845, "step": 2136 }, { "epoch": 0.24, "learning_rate": 1.7688921280434984e-05, "loss": 0.4776, "step": 2137 }, { "epoch": 0.24, "learning_rate": 1.768655399647146e-05, "loss": 0.4779, "step": 2138 }, { "epoch": 0.24, "learning_rate": 1.7684185659278423e-05, "loss": 0.4532, "step": 2139 }, { "epoch": 0.24, "learning_rate": 1.7681816269180394e-05, "loss": 0.4901, "step": 2140 }, { "epoch": 0.24, "learning_rate": 1.7679445826502033e-05, "loss": 0.4582, "step": 2141 }, { "epoch": 0.24, "learning_rate": 1.767707433156814e-05, "loss": 0.4821, "step": 2142 }, { "epoch": 0.24, "learning_rate": 1.767470178470366e-05, "loss": 0.4743, "step": 2143 }, { "epoch": 0.25, "learning_rate": 1.7672328186233692e-05, "loss": 0.5039, "step": 2144 }, { "epoch": 0.25, "learning_rate": 1.766995353648347e-05, "loss": 0.4517, "step": 2145 }, { "epoch": 0.25, "learning_rate": 1.766757783577837e-05, "loss": 0.4928, "step": 2146 }, { "epoch": 0.25, "learning_rate": 1.766520108444392e-05, "loss": 0.4828, "step": 2147 }, { "epoch": 0.25, "learning_rate": 1.7662823282805788e-05, "loss": 0.4716, "step": 2148 }, { "epoch": 0.25, "learning_rate": 1.766044443118978e-05, "loss": 0.4756, "step": 2149 }, { "epoch": 0.25, "learning_rate": 1.765806452992186e-05, "loss": 0.4674, "step": 2150 }, { "epoch": 0.25, "learning_rate": 1.7655683579328128e-05, "loss": 0.4787, "step": 2151 }, { "epoch": 0.25, "learning_rate": 1.765330157973482e-05, "loss": 0.5245, "step": 2152 }, { "epoch": 0.25, "learning_rate": 1.7650918531468326e-05, "loss": 0.4759, "step": 2153 }, { "epoch": 0.25, "learning_rate": 1.7648534434855177e-05, "loss": 0.4719, "step": 2154 }, { "epoch": 0.25, "learning_rate": 1.764614929022205e-05, "loss": 0.4807, "step": 2155 }, { "epoch": 0.25, "learning_rate": 1.764376309789576e-05, "loss": 0.4773, "step": 2156 }, { "epoch": 0.25, "learning_rate": 1.764137585820327e-05, "loss": 0.4787, "step": 2157 }, { "epoch": 0.25, "learning_rate": 1.7638987571471685e-05, "loss": 0.4781, "step": 2158 }, { "epoch": 0.25, "learning_rate": 1.7636598238028253e-05, "loss": 0.4679, "step": 2159 }, { "epoch": 0.25, "learning_rate": 1.7634207858200366e-05, "loss": 0.4922, "step": 2160 }, { "epoch": 0.25, "learning_rate": 1.763181643231556e-05, "loss": 0.491, "step": 2161 }, { "epoch": 0.25, "learning_rate": 1.7629423960701513e-05, "loss": 0.4677, "step": 2162 }, { "epoch": 0.25, "learning_rate": 1.7627030443686047e-05, "loss": 0.4873, "step": 2163 }, { "epoch": 0.25, "learning_rate": 1.762463588159713e-05, "loss": 0.4677, "step": 2164 }, { "epoch": 0.25, "learning_rate": 1.762224027476287e-05, "loss": 0.4581, "step": 2165 }, { "epoch": 0.25, "learning_rate": 1.761984362351151e-05, "loss": 0.5085, "step": 2166 }, { "epoch": 0.25, "learning_rate": 1.7617445928171458e-05, "loss": 0.4582, "step": 2167 }, { "epoch": 0.25, "learning_rate": 1.761504718907124e-05, "loss": 0.499, "step": 2168 }, { "epoch": 0.25, "learning_rate": 1.7612647406539548e-05, "loss": 0.4789, "step": 2169 }, { "epoch": 0.25, "learning_rate": 1.76102465809052e-05, "loss": 0.4757, "step": 2170 }, { "epoch": 0.25, "learning_rate": 1.760784471249716e-05, "loss": 0.4804, "step": 2171 }, { "epoch": 0.25, "learning_rate": 1.760544180164454e-05, "loss": 0.4877, "step": 2172 }, { "epoch": 0.25, "learning_rate": 1.7603037848676593e-05, "loss": 0.4686, "step": 2173 }, { "epoch": 0.25, "learning_rate": 1.7600632853922713e-05, "loss": 0.4784, "step": 2174 }, { "epoch": 0.25, "learning_rate": 1.7598226817712442e-05, "loss": 0.4851, "step": 2175 }, { "epoch": 0.25, "learning_rate": 1.7595819740375457e-05, "loss": 0.4848, "step": 2176 }, { "epoch": 0.25, "learning_rate": 1.7593411622241584e-05, "loss": 0.4683, "step": 2177 }, { "epoch": 0.25, "learning_rate": 1.7591002463640784e-05, "loss": 0.4815, "step": 2178 }, { "epoch": 0.25, "learning_rate": 1.758859226490317e-05, "loss": 0.5039, "step": 2179 }, { "epoch": 0.25, "learning_rate": 1.7586181026358987e-05, "loss": 0.4845, "step": 2180 }, { "epoch": 0.25, "learning_rate": 1.758376874833864e-05, "loss": 0.4929, "step": 2181 }, { "epoch": 0.25, "learning_rate": 1.7581355431172653e-05, "loss": 0.4848, "step": 2182 }, { "epoch": 0.25, "learning_rate": 1.757894107519171e-05, "loss": 0.4796, "step": 2183 }, { "epoch": 0.25, "learning_rate": 1.757652568072663e-05, "loss": 0.4889, "step": 2184 }, { "epoch": 0.25, "learning_rate": 1.757410924810838e-05, "loss": 0.4622, "step": 2185 }, { "epoch": 0.25, "learning_rate": 1.757169177766806e-05, "loss": 0.4766, "step": 2186 }, { "epoch": 0.25, "learning_rate": 1.7569273269736918e-05, "loss": 0.4708, "step": 2187 }, { "epoch": 0.25, "learning_rate": 1.756685372464635e-05, "loss": 0.537, "step": 2188 }, { "epoch": 0.25, "learning_rate": 1.7564433142727882e-05, "loss": 0.4926, "step": 2189 }, { "epoch": 0.25, "learning_rate": 1.7562011524313187e-05, "loss": 0.4633, "step": 2190 }, { "epoch": 0.25, "learning_rate": 1.755958886973408e-05, "loss": 0.4688, "step": 2191 }, { "epoch": 0.25, "learning_rate": 1.7557165179322522e-05, "loss": 0.4958, "step": 2192 }, { "epoch": 0.25, "learning_rate": 1.7554740453410617e-05, "loss": 0.4528, "step": 2193 }, { "epoch": 0.25, "learning_rate": 1.75523146923306e-05, "loss": 0.4919, "step": 2194 }, { "epoch": 0.25, "learning_rate": 1.7549887896414853e-05, "loss": 0.4762, "step": 2195 }, { "epoch": 0.25, "learning_rate": 1.7547460065995903e-05, "loss": 0.4834, "step": 2196 }, { "epoch": 0.25, "learning_rate": 1.754503120140642e-05, "loss": 0.5091, "step": 2197 }, { "epoch": 0.25, "learning_rate": 1.7542601302979213e-05, "loss": 0.4773, "step": 2198 }, { "epoch": 0.25, "learning_rate": 1.7540170371047228e-05, "loss": 0.4704, "step": 2199 }, { "epoch": 0.25, "learning_rate": 1.753773840594356e-05, "loss": 0.4855, "step": 2200 }, { "epoch": 0.25, "learning_rate": 1.753530540800144e-05, "loss": 0.48, "step": 2201 }, { "epoch": 0.25, "learning_rate": 1.7532871377554243e-05, "loss": 0.4906, "step": 2202 }, { "epoch": 0.25, "learning_rate": 1.7530436314935492e-05, "loss": 0.4709, "step": 2203 }, { "epoch": 0.25, "learning_rate": 1.7528000220478836e-05, "loss": 0.4907, "step": 2204 }, { "epoch": 0.25, "learning_rate": 1.7525563094518078e-05, "loss": 0.4629, "step": 2205 }, { "epoch": 0.25, "learning_rate": 1.7523124937387162e-05, "loss": 0.4857, "step": 2206 }, { "epoch": 0.25, "learning_rate": 1.7520685749420164e-05, "loss": 0.4732, "step": 2207 }, { "epoch": 0.25, "learning_rate": 1.7518245530951315e-05, "loss": 0.4853, "step": 2208 }, { "epoch": 0.25, "learning_rate": 1.7515804282314974e-05, "loss": 0.4757, "step": 2209 }, { "epoch": 0.25, "learning_rate": 1.751336200384564e-05, "loss": 0.48, "step": 2210 }, { "epoch": 0.25, "learning_rate": 1.751091869587797e-05, "loss": 0.4729, "step": 2211 }, { "epoch": 0.25, "learning_rate": 1.7508474358746753e-05, "loss": 0.4996, "step": 2212 }, { "epoch": 0.25, "learning_rate": 1.7506028992786912e-05, "loss": 0.4631, "step": 2213 }, { "epoch": 0.25, "learning_rate": 1.7503582598333517e-05, "loss": 0.4687, "step": 2214 }, { "epoch": 0.25, "learning_rate": 1.750113517572178e-05, "loss": 0.4873, "step": 2215 }, { "epoch": 0.25, "learning_rate": 1.749868672528705e-05, "loss": 0.474, "step": 2216 }, { "epoch": 0.25, "learning_rate": 1.7496237247364827e-05, "loss": 0.4696, "step": 2217 }, { "epoch": 0.25, "learning_rate": 1.7493786742290734e-05, "loss": 0.4869, "step": 2218 }, { "epoch": 0.25, "learning_rate": 1.7491335210400554e-05, "loss": 0.4751, "step": 2219 }, { "epoch": 0.25, "learning_rate": 1.7488882652030193e-05, "loss": 0.5086, "step": 2220 }, { "epoch": 0.25, "learning_rate": 1.748642906751571e-05, "loss": 0.4697, "step": 2221 }, { "epoch": 0.25, "learning_rate": 1.7483974457193307e-05, "loss": 0.4575, "step": 2222 }, { "epoch": 0.25, "learning_rate": 1.748151882139931e-05, "loss": 0.482, "step": 2223 }, { "epoch": 0.25, "learning_rate": 1.7479062160470205e-05, "loss": 0.4892, "step": 2224 }, { "epoch": 0.25, "learning_rate": 1.74766044747426e-05, "loss": 0.4507, "step": 2225 }, { "epoch": 0.25, "learning_rate": 1.7474145764553262e-05, "loss": 0.4824, "step": 2226 }, { "epoch": 0.25, "learning_rate": 1.7471686030239082e-05, "loss": 0.4685, "step": 2227 }, { "epoch": 0.25, "learning_rate": 1.7469225272137104e-05, "loss": 0.5125, "step": 2228 }, { "epoch": 0.25, "learning_rate": 1.7466763490584504e-05, "loss": 0.4813, "step": 2229 }, { "epoch": 0.25, "learning_rate": 1.7464300685918602e-05, "loss": 0.4821, "step": 2230 }, { "epoch": 0.25, "learning_rate": 1.7461836858476858e-05, "loss": 0.4607, "step": 2231 }, { "epoch": 0.26, "learning_rate": 1.745937200859687e-05, "loss": 0.4742, "step": 2232 }, { "epoch": 0.26, "learning_rate": 1.7456906136616374e-05, "loss": 0.47, "step": 2233 }, { "epoch": 0.26, "learning_rate": 1.7454439242873257e-05, "loss": 0.4881, "step": 2234 }, { "epoch": 0.26, "learning_rate": 1.745197132770553e-05, "loss": 0.4716, "step": 2235 }, { "epoch": 0.26, "learning_rate": 1.7449502391451362e-05, "loss": 0.5046, "step": 2236 }, { "epoch": 0.26, "learning_rate": 1.7447032434449045e-05, "loss": 0.48, "step": 2237 }, { "epoch": 0.26, "learning_rate": 1.7444561457037022e-05, "loss": 0.4854, "step": 2238 }, { "epoch": 0.26, "learning_rate": 1.744208945955387e-05, "loss": 0.4625, "step": 2239 }, { "epoch": 0.26, "learning_rate": 1.743961644233831e-05, "loss": 0.4795, "step": 2240 }, { "epoch": 0.26, "learning_rate": 1.7437142405729196e-05, "loss": 0.4831, "step": 2241 }, { "epoch": 0.26, "learning_rate": 1.743466735006553e-05, "loss": 0.4779, "step": 2242 }, { "epoch": 0.26, "learning_rate": 1.7432191275686454e-05, "loss": 0.4721, "step": 2243 }, { "epoch": 0.26, "learning_rate": 1.7429714182931238e-05, "loss": 0.4879, "step": 2244 }, { "epoch": 0.26, "learning_rate": 1.7427236072139306e-05, "loss": 0.4855, "step": 2245 }, { "epoch": 0.26, "learning_rate": 1.7424756943650203e-05, "loss": 0.4936, "step": 2246 }, { "epoch": 0.26, "learning_rate": 1.7422276797803638e-05, "loss": 0.4762, "step": 2247 }, { "epoch": 0.26, "learning_rate": 1.741979563493944e-05, "loss": 0.4638, "step": 2248 }, { "epoch": 0.26, "learning_rate": 1.741731345539758e-05, "loss": 0.4827, "step": 2249 }, { "epoch": 0.26, "learning_rate": 1.741483025951818e-05, "loss": 0.4847, "step": 2250 }, { "epoch": 0.26, "learning_rate": 1.7412346047641485e-05, "loss": 0.4682, "step": 2251 }, { "epoch": 0.26, "learning_rate": 1.74098608201079e-05, "loss": 0.4909, "step": 2252 }, { "epoch": 0.26, "learning_rate": 1.7407374577257945e-05, "loss": 0.479, "step": 2253 }, { "epoch": 0.26, "learning_rate": 1.7404887319432294e-05, "loss": 0.5104, "step": 2254 }, { "epoch": 0.26, "learning_rate": 1.740239904697176e-05, "loss": 0.4657, "step": 2255 }, { "epoch": 0.26, "learning_rate": 1.7399909760217285e-05, "loss": 0.4881, "step": 2256 }, { "epoch": 0.26, "learning_rate": 1.7397419459509962e-05, "loss": 0.4684, "step": 2257 }, { "epoch": 0.26, "learning_rate": 1.739492814519102e-05, "loss": 0.4574, "step": 2258 }, { "epoch": 0.26, "learning_rate": 1.739243581760182e-05, "loss": 0.4794, "step": 2259 }, { "epoch": 0.26, "learning_rate": 1.738994247708387e-05, "loss": 0.4778, "step": 2260 }, { "epoch": 0.26, "learning_rate": 1.7387448123978813e-05, "loss": 0.489, "step": 2261 }, { "epoch": 0.26, "learning_rate": 1.7384952758628423e-05, "loss": 0.4871, "step": 2262 }, { "epoch": 0.26, "learning_rate": 1.738245638137463e-05, "loss": 0.4855, "step": 2263 }, { "epoch": 0.26, "learning_rate": 1.7379958992559494e-05, "loss": 0.471, "step": 2264 }, { "epoch": 0.26, "learning_rate": 1.737746059252521e-05, "loss": 0.4735, "step": 2265 }, { "epoch": 0.26, "learning_rate": 1.737496118161411e-05, "loss": 0.4721, "step": 2266 }, { "epoch": 0.26, "learning_rate": 1.7372460760168676e-05, "loss": 0.492, "step": 2267 }, { "epoch": 0.26, "learning_rate": 1.736995932853152e-05, "loss": 0.4756, "step": 2268 }, { "epoch": 0.26, "learning_rate": 1.736745688704539e-05, "loss": 0.5099, "step": 2269 }, { "epoch": 0.26, "learning_rate": 1.736495343605318e-05, "loss": 0.476, "step": 2270 }, { "epoch": 0.26, "learning_rate": 1.736244897589792e-05, "loss": 0.4761, "step": 2271 }, { "epoch": 0.26, "learning_rate": 1.7359943506922775e-05, "loss": 0.4725, "step": 2272 }, { "epoch": 0.26, "learning_rate": 1.735743702947105e-05, "loss": 0.477, "step": 2273 }, { "epoch": 0.26, "learning_rate": 1.7354929543886186e-05, "loss": 0.4682, "step": 2274 }, { "epoch": 0.26, "learning_rate": 1.7352421050511767e-05, "loss": 0.4591, "step": 2275 }, { "epoch": 0.26, "learning_rate": 1.734991154969152e-05, "loss": 0.4755, "step": 2276 }, { "epoch": 0.26, "learning_rate": 1.7347401041769284e-05, "loss": 0.4902, "step": 2277 }, { "epoch": 0.26, "learning_rate": 1.7344889527089074e-05, "loss": 0.4777, "step": 2278 }, { "epoch": 0.26, "learning_rate": 1.7342377005995014e-05, "loss": 0.4873, "step": 2279 }, { "epoch": 0.26, "learning_rate": 1.733986347883138e-05, "loss": 0.4777, "step": 2280 }, { "epoch": 0.26, "learning_rate": 1.7337348945942572e-05, "loss": 0.4675, "step": 2281 }, { "epoch": 0.26, "learning_rate": 1.7334833407673145e-05, "loss": 0.4943, "step": 2282 }, { "epoch": 0.26, "learning_rate": 1.7332316864367785e-05, "loss": 0.4708, "step": 2283 }, { "epoch": 0.26, "learning_rate": 1.732979931637131e-05, "loss": 0.4695, "step": 2284 }, { "epoch": 0.26, "learning_rate": 1.7327280764028683e-05, "loss": 0.488, "step": 2285 }, { "epoch": 0.26, "learning_rate": 1.7324761207685005e-05, "loss": 0.5035, "step": 2286 }, { "epoch": 0.26, "learning_rate": 1.7322240647685503e-05, "loss": 0.4726, "step": 2287 }, { "epoch": 0.26, "learning_rate": 1.7319719084375556e-05, "loss": 0.4609, "step": 2288 }, { "epoch": 0.26, "learning_rate": 1.7317196518100672e-05, "loss": 0.488, "step": 2289 }, { "epoch": 0.26, "learning_rate": 1.7314672949206502e-05, "loss": 0.474, "step": 2290 }, { "epoch": 0.26, "learning_rate": 1.731214837803883e-05, "loss": 0.4646, "step": 2291 }, { "epoch": 0.26, "learning_rate": 1.7309622804943573e-05, "loss": 0.4767, "step": 2292 }, { "epoch": 0.26, "learning_rate": 1.73070962302668e-05, "loss": 0.5126, "step": 2293 }, { "epoch": 0.26, "learning_rate": 1.7304568654354703e-05, "loss": 0.4779, "step": 2294 }, { "epoch": 0.26, "learning_rate": 1.7302040077553616e-05, "loss": 0.4769, "step": 2295 }, { "epoch": 0.26, "learning_rate": 1.7299510500210015e-05, "loss": 0.4764, "step": 2296 }, { "epoch": 0.26, "learning_rate": 1.7296979922670502e-05, "loss": 0.4786, "step": 2297 }, { "epoch": 0.26, "learning_rate": 1.729444834528183e-05, "loss": 0.4735, "step": 2298 }, { "epoch": 0.26, "learning_rate": 1.7291915768390875e-05, "loss": 0.4773, "step": 2299 }, { "epoch": 0.26, "learning_rate": 1.728938219234466e-05, "loss": 0.4762, "step": 2300 }, { "epoch": 0.26, "learning_rate": 1.728684761749034e-05, "loss": 0.4629, "step": 2301 }, { "epoch": 0.26, "learning_rate": 1.728431204417521e-05, "loss": 0.4624, "step": 2302 }, { "epoch": 0.26, "learning_rate": 1.7281775472746695e-05, "loss": 0.4793, "step": 2303 }, { "epoch": 0.26, "learning_rate": 1.727923790355237e-05, "loss": 0.4707, "step": 2304 }, { "epoch": 0.26, "learning_rate": 1.7276699336939936e-05, "loss": 0.4638, "step": 2305 }, { "epoch": 0.26, "learning_rate": 1.7274159773257227e-05, "loss": 0.492, "step": 2306 }, { "epoch": 0.26, "learning_rate": 1.7271619212852232e-05, "loss": 0.4632, "step": 2307 }, { "epoch": 0.26, "learning_rate": 1.726907765607305e-05, "loss": 0.479, "step": 2308 }, { "epoch": 0.26, "learning_rate": 1.7266535103267943e-05, "loss": 0.4955, "step": 2309 }, { "epoch": 0.26, "learning_rate": 1.726399155478529e-05, "loss": 0.471, "step": 2310 }, { "epoch": 0.26, "learning_rate": 1.7261447010973623e-05, "loss": 0.4869, "step": 2311 }, { "epoch": 0.26, "learning_rate": 1.7258901472181587e-05, "loss": 0.4765, "step": 2312 }, { "epoch": 0.26, "learning_rate": 1.725635493875799e-05, "loss": 0.4795, "step": 2313 }, { "epoch": 0.26, "learning_rate": 1.725380741105176e-05, "loss": 0.4612, "step": 2314 }, { "epoch": 0.26, "learning_rate": 1.7251258889411964e-05, "loss": 0.48, "step": 2315 }, { "epoch": 0.26, "learning_rate": 1.724870937418781e-05, "loss": 0.483, "step": 2316 }, { "epoch": 0.26, "learning_rate": 1.7246158865728634e-05, "loss": 0.4708, "step": 2317 }, { "epoch": 0.26, "learning_rate": 1.7243607364383916e-05, "loss": 0.4752, "step": 2318 }, { "epoch": 0.27, "learning_rate": 1.7241054870503262e-05, "loss": 0.4801, "step": 2319 }, { "epoch": 0.27, "learning_rate": 1.723850138443643e-05, "loss": 0.4739, "step": 2320 }, { "epoch": 0.27, "learning_rate": 1.72359469065333e-05, "loss": 0.4771, "step": 2321 }, { "epoch": 0.27, "learning_rate": 1.723339143714389e-05, "loss": 0.4811, "step": 2322 }, { "epoch": 0.27, "learning_rate": 1.7230834976618364e-05, "loss": 0.5013, "step": 2323 }, { "epoch": 0.27, "learning_rate": 1.7228277525307007e-05, "loss": 0.4576, "step": 2324 }, { "epoch": 0.27, "learning_rate": 1.7225719083560246e-05, "loss": 0.4736, "step": 2325 }, { "epoch": 0.27, "learning_rate": 1.7223159651728653e-05, "loss": 0.4784, "step": 2326 }, { "epoch": 0.27, "learning_rate": 1.7220599230162917e-05, "loss": 0.4742, "step": 2327 }, { "epoch": 0.27, "learning_rate": 1.7218037819213883e-05, "loss": 0.4799, "step": 2328 }, { "epoch": 0.27, "learning_rate": 1.7215475419232516e-05, "loss": 0.4987, "step": 2329 }, { "epoch": 0.27, "learning_rate": 1.7212912030569923e-05, "loss": 0.4768, "step": 2330 }, { "epoch": 0.27, "learning_rate": 1.7210347653577343e-05, "loss": 0.4819, "step": 2331 }, { "epoch": 0.27, "learning_rate": 1.7207782288606154e-05, "loss": 0.4671, "step": 2332 }, { "epoch": 0.27, "learning_rate": 1.720521593600787e-05, "loss": 0.4661, "step": 2333 }, { "epoch": 0.27, "learning_rate": 1.7202648596134143e-05, "loss": 0.4803, "step": 2334 }, { "epoch": 0.27, "learning_rate": 1.7200080269336745e-05, "loss": 0.4671, "step": 2335 }, { "epoch": 0.27, "learning_rate": 1.71975109559676e-05, "loss": 0.4705, "step": 2336 }, { "epoch": 0.27, "learning_rate": 1.7194940656378763e-05, "loss": 0.4898, "step": 2337 }, { "epoch": 0.27, "learning_rate": 1.7192369370922423e-05, "loss": 0.4762, "step": 2338 }, { "epoch": 0.27, "learning_rate": 1.7189797099950895e-05, "loss": 0.4991, "step": 2339 }, { "epoch": 0.27, "learning_rate": 1.7187223843816648e-05, "loss": 0.4784, "step": 2340 }, { "epoch": 0.27, "learning_rate": 1.7184649602872274e-05, "loss": 0.4749, "step": 2341 }, { "epoch": 0.27, "learning_rate": 1.7182074377470494e-05, "loss": 0.4777, "step": 2342 }, { "epoch": 0.27, "learning_rate": 1.717949816796418e-05, "loss": 0.4733, "step": 2343 }, { "epoch": 0.27, "learning_rate": 1.7176920974706318e-05, "loss": 0.4914, "step": 2344 }, { "epoch": 0.27, "learning_rate": 1.7174342798050056e-05, "loss": 0.4806, "step": 2345 }, { "epoch": 0.27, "learning_rate": 1.7171763638348653e-05, "loss": 0.4793, "step": 2346 }, { "epoch": 0.27, "learning_rate": 1.7169183495955516e-05, "loss": 0.4827, "step": 2347 }, { "epoch": 0.27, "learning_rate": 1.7166602371224178e-05, "loss": 0.4725, "step": 2348 }, { "epoch": 0.27, "learning_rate": 1.716402026450831e-05, "loss": 0.4927, "step": 2349 }, { "epoch": 0.27, "learning_rate": 1.7161437176161727e-05, "loss": 0.4618, "step": 2350 }, { "epoch": 0.27, "learning_rate": 1.7158853106538358e-05, "loss": 0.4854, "step": 2351 }, { "epoch": 0.27, "learning_rate": 1.7156268055992286e-05, "loss": 0.4853, "step": 2352 }, { "epoch": 0.27, "learning_rate": 1.7153682024877716e-05, "loss": 0.4795, "step": 2353 }, { "epoch": 0.27, "learning_rate": 1.7151095013548996e-05, "loss": 0.4838, "step": 2354 }, { "epoch": 0.27, "learning_rate": 1.7148507022360602e-05, "loss": 0.4743, "step": 2355 }, { "epoch": 0.27, "learning_rate": 1.7145918051667147e-05, "loss": 0.4669, "step": 2356 }, { "epoch": 0.27, "learning_rate": 1.714332810182338e-05, "loss": 0.4712, "step": 2357 }, { "epoch": 0.27, "learning_rate": 1.7140737173184178e-05, "loss": 0.4703, "step": 2358 }, { "epoch": 0.27, "learning_rate": 1.713814526610456e-05, "loss": 0.48, "step": 2359 }, { "epoch": 0.27, "learning_rate": 1.713555238093967e-05, "loss": 0.4717, "step": 2360 }, { "epoch": 0.27, "learning_rate": 1.7132958518044797e-05, "loss": 0.4669, "step": 2361 }, { "epoch": 0.27, "learning_rate": 1.713036367777535e-05, "loss": 0.4762, "step": 2362 }, { "epoch": 0.27, "learning_rate": 1.7127767860486892e-05, "loss": 0.4835, "step": 2363 }, { "epoch": 0.27, "learning_rate": 1.71251710665351e-05, "loss": 0.4753, "step": 2364 }, { "epoch": 0.27, "learning_rate": 1.7122573296275788e-05, "loss": 0.4621, "step": 2365 }, { "epoch": 0.27, "learning_rate": 1.711997455006492e-05, "loss": 0.4649, "step": 2366 }, { "epoch": 0.27, "learning_rate": 1.711737482825858e-05, "loss": 0.4877, "step": 2367 }, { "epoch": 0.27, "learning_rate": 1.7114774131212983e-05, "loss": 0.4709, "step": 2368 }, { "epoch": 0.27, "learning_rate": 1.7112172459284478e-05, "loss": 0.4921, "step": 2369 }, { "epoch": 0.27, "learning_rate": 1.7109569812829565e-05, "loss": 0.4739, "step": 2370 }, { "epoch": 0.27, "learning_rate": 1.710696619220486e-05, "loss": 0.4971, "step": 2371 }, { "epoch": 0.27, "learning_rate": 1.7104361597767107e-05, "loss": 0.4782, "step": 2372 }, { "epoch": 0.27, "learning_rate": 1.7101756029873208e-05, "loss": 0.4725, "step": 2373 }, { "epoch": 0.27, "learning_rate": 1.7099149488880174e-05, "loss": 0.4709, "step": 2374 }, { "epoch": 0.27, "learning_rate": 1.709654197514517e-05, "loss": 0.4594, "step": 2375 }, { "epoch": 0.27, "learning_rate": 1.709393348902547e-05, "loss": 0.4697, "step": 2376 }, { "epoch": 0.27, "learning_rate": 1.7091324030878504e-05, "loss": 0.4889, "step": 2377 }, { "epoch": 0.27, "learning_rate": 1.7088713601061823e-05, "loss": 0.4615, "step": 2378 }, { "epoch": 0.27, "learning_rate": 1.7086102199933116e-05, "loss": 0.4891, "step": 2379 }, { "epoch": 0.27, "learning_rate": 1.7083489827850202e-05, "loss": 0.4881, "step": 2380 }, { "epoch": 0.27, "learning_rate": 1.7080876485171035e-05, "loss": 0.4834, "step": 2381 }, { "epoch": 0.27, "learning_rate": 1.70782621722537e-05, "loss": 0.4731, "step": 2382 }, { "epoch": 0.27, "learning_rate": 1.7075646889456415e-05, "loss": 0.5067, "step": 2383 }, { "epoch": 0.27, "learning_rate": 1.7073030637137535e-05, "loss": 0.4691, "step": 2384 }, { "epoch": 0.27, "learning_rate": 1.7070413415655548e-05, "loss": 0.4868, "step": 2385 }, { "epoch": 0.27, "learning_rate": 1.7067795225369063e-05, "loss": 0.4821, "step": 2386 }, { "epoch": 0.27, "learning_rate": 1.7065176066636836e-05, "loss": 0.4938, "step": 2387 }, { "epoch": 0.27, "learning_rate": 1.706255593981775e-05, "loss": 0.4777, "step": 2388 }, { "epoch": 0.27, "learning_rate": 1.7059934845270826e-05, "loss": 0.5058, "step": 2389 }, { "epoch": 0.27, "learning_rate": 1.70573127833552e-05, "loss": 0.4644, "step": 2390 }, { "epoch": 0.27, "learning_rate": 1.705468975443016e-05, "loss": 0.4899, "step": 2391 }, { "epoch": 0.27, "learning_rate": 1.7052065758855123e-05, "loss": 0.4905, "step": 2392 }, { "epoch": 0.27, "learning_rate": 1.704944079698963e-05, "loss": 0.4652, "step": 2393 }, { "epoch": 0.27, "learning_rate": 1.704681486919336e-05, "loss": 0.4839, "step": 2394 }, { "epoch": 0.27, "learning_rate": 1.7044187975826126e-05, "loss": 0.4743, "step": 2395 }, { "epoch": 0.27, "learning_rate": 1.704156011724787e-05, "loss": 0.4723, "step": 2396 }, { "epoch": 0.27, "learning_rate": 1.7038931293818665e-05, "loss": 0.4885, "step": 2397 }, { "epoch": 0.27, "learning_rate": 1.703630150589872e-05, "loss": 0.471, "step": 2398 }, { "epoch": 0.27, "learning_rate": 1.7033670753848373e-05, "loss": 0.4791, "step": 2399 }, { "epoch": 0.27, "learning_rate": 1.7031039038028103e-05, "loss": 0.4562, "step": 2400 }, { "epoch": 0.27, "learning_rate": 1.7028406358798505e-05, "loss": 0.4891, "step": 2401 }, { "epoch": 0.27, "learning_rate": 1.7025772716520324e-05, "loss": 0.4637, "step": 2402 }, { "epoch": 0.27, "learning_rate": 1.7023138111554412e-05, "loss": 0.4753, "step": 2403 }, { "epoch": 0.27, "learning_rate": 1.702050254426179e-05, "loss": 0.4727, "step": 2404 }, { "epoch": 0.27, "learning_rate": 1.701786601500357e-05, "loss": 0.4795, "step": 2405 }, { "epoch": 0.27, "learning_rate": 1.701522852414103e-05, "loss": 0.4705, "step": 2406 }, { "epoch": 0.28, "learning_rate": 1.7012590072035554e-05, "loss": 0.5054, "step": 2407 }, { "epoch": 0.28, "learning_rate": 1.7009950659048677e-05, "loss": 0.4825, "step": 2408 }, { "epoch": 0.28, "learning_rate": 1.7007310285542057e-05, "loss": 0.4799, "step": 2409 }, { "epoch": 0.28, "learning_rate": 1.7004668951877475e-05, "loss": 0.4526, "step": 2410 }, { "epoch": 0.28, "learning_rate": 1.7002026658416862e-05, "loss": 0.4672, "step": 2411 }, { "epoch": 0.28, "learning_rate": 1.699938340552227e-05, "loss": 0.4956, "step": 2412 }, { "epoch": 0.28, "learning_rate": 1.699673919355588e-05, "loss": 0.4727, "step": 2413 }, { "epoch": 0.28, "learning_rate": 1.699409402288001e-05, "loss": 0.4746, "step": 2414 }, { "epoch": 0.28, "learning_rate": 1.699144789385711e-05, "loss": 0.4814, "step": 2415 }, { "epoch": 0.28, "learning_rate": 1.6988800806849754e-05, "loss": 0.4645, "step": 2416 }, { "epoch": 0.28, "learning_rate": 1.6986152762220655e-05, "loss": 0.4808, "step": 2417 }, { "epoch": 0.28, "learning_rate": 1.6983503760332653e-05, "loss": 0.4715, "step": 2418 }, { "epoch": 0.28, "learning_rate": 1.698085380154872e-05, "loss": 0.4588, "step": 2419 }, { "epoch": 0.28, "learning_rate": 1.6978202886231963e-05, "loss": 0.4597, "step": 2420 }, { "epoch": 0.28, "learning_rate": 1.6975551014745614e-05, "loss": 0.5044, "step": 2421 }, { "epoch": 0.28, "learning_rate": 1.697289818745304e-05, "loss": 0.463, "step": 2422 }, { "epoch": 0.28, "learning_rate": 1.6970244404717732e-05, "loss": 0.481, "step": 2423 }, { "epoch": 0.28, "learning_rate": 1.6967589666903324e-05, "loss": 0.4816, "step": 2424 }, { "epoch": 0.28, "learning_rate": 1.696493397437357e-05, "loss": 0.4928, "step": 2425 }, { "epoch": 0.28, "learning_rate": 1.6962277327492366e-05, "loss": 0.4689, "step": 2426 }, { "epoch": 0.28, "learning_rate": 1.6959619726623722e-05, "loss": 0.4803, "step": 2427 }, { "epoch": 0.28, "learning_rate": 1.6956961172131796e-05, "loss": 0.4684, "step": 2428 }, { "epoch": 0.28, "learning_rate": 1.6954301664380867e-05, "loss": 0.4796, "step": 2429 }, { "epoch": 0.28, "learning_rate": 1.6951641203735345e-05, "loss": 0.4839, "step": 2430 }, { "epoch": 0.28, "learning_rate": 1.694897979055978e-05, "loss": 0.4781, "step": 2431 }, { "epoch": 0.28, "learning_rate": 1.6946317425218834e-05, "loss": 0.4846, "step": 2432 }, { "epoch": 0.28, "learning_rate": 1.6943654108077317e-05, "loss": 0.4773, "step": 2433 }, { "epoch": 0.28, "learning_rate": 1.6940989839500167e-05, "loss": 0.4712, "step": 2434 }, { "epoch": 0.28, "learning_rate": 1.6938324619852435e-05, "loss": 0.4936, "step": 2435 }, { "epoch": 0.28, "learning_rate": 1.693565844949933e-05, "loss": 0.4735, "step": 2436 }, { "epoch": 0.28, "learning_rate": 1.693299132880617e-05, "loss": 0.4663, "step": 2437 }, { "epoch": 0.28, "learning_rate": 1.693032325813841e-05, "loss": 0.488, "step": 2438 }, { "epoch": 0.28, "learning_rate": 1.6927654237861635e-05, "loss": 0.4665, "step": 2439 }, { "epoch": 0.28, "learning_rate": 1.6924984268341563e-05, "loss": 0.4767, "step": 2440 }, { "epoch": 0.28, "learning_rate": 1.6922313349944037e-05, "loss": 0.4821, "step": 2441 }, { "epoch": 0.28, "learning_rate": 1.6919641483035035e-05, "loss": 0.4513, "step": 2442 }, { "epoch": 0.28, "learning_rate": 1.6916968667980658e-05, "loss": 0.4734, "step": 2443 }, { "epoch": 0.28, "learning_rate": 1.6914294905147144e-05, "loss": 0.4782, "step": 2444 }, { "epoch": 0.28, "learning_rate": 1.6911620194900862e-05, "loss": 0.4684, "step": 2445 }, { "epoch": 0.28, "learning_rate": 1.6908944537608302e-05, "loss": 0.4643, "step": 2446 }, { "epoch": 0.28, "learning_rate": 1.6906267933636087e-05, "loss": 0.4868, "step": 2447 }, { "epoch": 0.28, "learning_rate": 1.6903590383350975e-05, "loss": 0.4797, "step": 2448 }, { "epoch": 0.28, "learning_rate": 1.690091188711985e-05, "loss": 0.4894, "step": 2449 }, { "epoch": 0.28, "learning_rate": 1.689823244530973e-05, "loss": 0.4657, "step": 2450 }, { "epoch": 0.28, "learning_rate": 1.6895552058287752e-05, "loss": 0.4817, "step": 2451 }, { "epoch": 0.28, "learning_rate": 1.689287072642119e-05, "loss": 0.4785, "step": 2452 }, { "epoch": 0.28, "learning_rate": 1.6890188450077445e-05, "loss": 0.4668, "step": 2453 }, { "epoch": 0.28, "learning_rate": 1.6887505229624053e-05, "loss": 0.4684, "step": 2454 }, { "epoch": 0.28, "learning_rate": 1.6884821065428673e-05, "loss": 0.4807, "step": 2455 }, { "epoch": 0.28, "learning_rate": 1.6882135957859095e-05, "loss": 0.4894, "step": 2456 }, { "epoch": 0.28, "learning_rate": 1.6879449907283238e-05, "loss": 0.4591, "step": 2457 }, { "epoch": 0.28, "learning_rate": 1.6876762914069154e-05, "loss": 0.4734, "step": 2458 }, { "epoch": 0.28, "learning_rate": 1.6874074978585018e-05, "loss": 0.4596, "step": 2459 }, { "epoch": 0.28, "learning_rate": 1.687138610119914e-05, "loss": 0.4737, "step": 2460 }, { "epoch": 0.28, "learning_rate": 1.686869628227995e-05, "loss": 0.5029, "step": 2461 }, { "epoch": 0.28, "learning_rate": 1.686600552219602e-05, "loss": 0.4675, "step": 2462 }, { "epoch": 0.28, "learning_rate": 1.686331382131604e-05, "loss": 0.4601, "step": 2463 }, { "epoch": 0.28, "learning_rate": 1.686062118000884e-05, "loss": 0.4806, "step": 2464 }, { "epoch": 0.28, "learning_rate": 1.6857927598643362e-05, "loss": 0.4758, "step": 2465 }, { "epoch": 0.28, "learning_rate": 1.6855233077588697e-05, "loss": 0.503, "step": 2466 }, { "epoch": 0.28, "learning_rate": 1.6852537617214043e-05, "loss": 0.4894, "step": 2467 }, { "epoch": 0.28, "learning_rate": 1.6849841217888748e-05, "loss": 0.4551, "step": 2468 }, { "epoch": 0.28, "learning_rate": 1.6847143879982276e-05, "loss": 0.4697, "step": 2469 }, { "epoch": 0.28, "learning_rate": 1.684444560386422e-05, "loss": 0.4702, "step": 2470 }, { "epoch": 0.28, "learning_rate": 1.6841746389904306e-05, "loss": 0.4724, "step": 2471 }, { "epoch": 0.28, "learning_rate": 1.6839046238472387e-05, "loss": 0.49, "step": 2472 }, { "epoch": 0.28, "learning_rate": 1.6836345149938445e-05, "loss": 0.4787, "step": 2473 }, { "epoch": 0.28, "learning_rate": 1.6833643124672586e-05, "loss": 0.4715, "step": 2474 }, { "epoch": 0.28, "learning_rate": 1.683094016304505e-05, "loss": 0.4781, "step": 2475 }, { "epoch": 0.28, "learning_rate": 1.6828236265426205e-05, "loss": 0.4622, "step": 2476 }, { "epoch": 0.28, "learning_rate": 1.6825531432186545e-05, "loss": 0.4672, "step": 2477 }, { "epoch": 0.28, "learning_rate": 1.6822825663696683e-05, "loss": 0.4731, "step": 2478 }, { "epoch": 0.28, "learning_rate": 1.6820118960327386e-05, "loss": 0.4835, "step": 2479 }, { "epoch": 0.28, "learning_rate": 1.681741132244952e-05, "loss": 0.4742, "step": 2480 }, { "epoch": 0.28, "learning_rate": 1.6814702750434097e-05, "loss": 0.4779, "step": 2481 }, { "epoch": 0.28, "learning_rate": 1.6811993244652248e-05, "loss": 0.4848, "step": 2482 }, { "epoch": 0.28, "learning_rate": 1.6809282805475243e-05, "loss": 0.4667, "step": 2483 }, { "epoch": 0.28, "learning_rate": 1.680657143327447e-05, "loss": 0.479, "step": 2484 }, { "epoch": 0.28, "learning_rate": 1.680385912842144e-05, "loss": 0.466, "step": 2485 }, { "epoch": 0.28, "learning_rate": 1.680114589128781e-05, "loss": 0.4768, "step": 2486 }, { "epoch": 0.28, "learning_rate": 1.6798431722245346e-05, "loss": 0.4632, "step": 2487 }, { "epoch": 0.28, "learning_rate": 1.6795716621665957e-05, "loss": 0.5026, "step": 2488 }, { "epoch": 0.28, "learning_rate": 1.6793000589921666e-05, "loss": 0.4801, "step": 2489 }, { "epoch": 0.28, "learning_rate": 1.6790283627384633e-05, "loss": 0.4888, "step": 2490 }, { "epoch": 0.28, "learning_rate": 1.6787565734427143e-05, "loss": 0.4666, "step": 2491 }, { "epoch": 0.28, "learning_rate": 1.6784846911421605e-05, "loss": 0.4721, "step": 2492 }, { "epoch": 0.28, "learning_rate": 1.678212715874056e-05, "loss": 0.4713, "step": 2493 }, { "epoch": 0.29, "learning_rate": 1.677940647675668e-05, "loss": 0.4702, "step": 2494 }, { "epoch": 0.29, "learning_rate": 1.6776684865842748e-05, "loss": 0.4716, "step": 2495 }, { "epoch": 0.29, "learning_rate": 1.6773962326371696e-05, "loss": 0.4623, "step": 2496 }, { "epoch": 0.29, "learning_rate": 1.677123885871657e-05, "loss": 0.4892, "step": 2497 }, { "epoch": 0.29, "learning_rate": 1.6768514463250544e-05, "loss": 0.4916, "step": 2498 }, { "epoch": 0.29, "learning_rate": 1.6765789140346916e-05, "loss": 0.4808, "step": 2499 }, { "epoch": 0.29, "learning_rate": 1.6763062890379128e-05, "loss": 0.4719, "step": 2500 }, { "epoch": 0.29, "learning_rate": 1.6760335713720727e-05, "loss": 0.4711, "step": 2501 }, { "epoch": 0.29, "learning_rate": 1.6757607610745405e-05, "loss": 0.4837, "step": 2502 }, { "epoch": 0.29, "learning_rate": 1.6754878581826966e-05, "loss": 0.4707, "step": 2503 }, { "epoch": 0.29, "learning_rate": 1.675214862733935e-05, "loss": 0.4648, "step": 2504 }, { "epoch": 0.29, "learning_rate": 1.674941774765662e-05, "loss": 0.4742, "step": 2505 }, { "epoch": 0.29, "learning_rate": 1.6746685943152975e-05, "loss": 0.4896, "step": 2506 }, { "epoch": 0.29, "learning_rate": 1.674395321420273e-05, "loss": 0.4759, "step": 2507 }, { "epoch": 0.29, "learning_rate": 1.674121956118032e-05, "loss": 0.4774, "step": 2508 }, { "epoch": 0.29, "learning_rate": 1.673848498446033e-05, "loss": 0.4727, "step": 2509 }, { "epoch": 0.29, "learning_rate": 1.6735749484417452e-05, "loss": 0.4816, "step": 2510 }, { "epoch": 0.29, "learning_rate": 1.673301306142651e-05, "loss": 0.475, "step": 2511 }, { "epoch": 0.29, "learning_rate": 1.6730275715862455e-05, "loss": 0.4677, "step": 2512 }, { "epoch": 0.29, "learning_rate": 1.672753744810037e-05, "loss": 0.4701, "step": 2513 }, { "epoch": 0.29, "learning_rate": 1.6724798258515452e-05, "loss": 0.4852, "step": 2514 }, { "epoch": 0.29, "learning_rate": 1.6722058147483034e-05, "loss": 0.49, "step": 2515 }, { "epoch": 0.29, "learning_rate": 1.671931711537857e-05, "loss": 0.4704, "step": 2516 }, { "epoch": 0.29, "learning_rate": 1.6716575162577647e-05, "loss": 0.4733, "step": 2517 }, { "epoch": 0.29, "learning_rate": 1.671383228945597e-05, "loss": 0.4668, "step": 2518 }, { "epoch": 0.29, "learning_rate": 1.6711088496389375e-05, "loss": 0.4812, "step": 2519 }, { "epoch": 0.29, "learning_rate": 1.6708343783753824e-05, "loss": 0.4573, "step": 2520 }, { "epoch": 0.29, "learning_rate": 1.67055981519254e-05, "loss": 0.485, "step": 2521 }, { "epoch": 0.29, "learning_rate": 1.6702851601280322e-05, "loss": 0.4801, "step": 2522 }, { "epoch": 0.29, "learning_rate": 1.6700104132194925e-05, "loss": 0.4627, "step": 2523 }, { "epoch": 0.29, "learning_rate": 1.6697355745045678e-05, "loss": 0.479, "step": 2524 }, { "epoch": 0.29, "learning_rate": 1.6694606440209163e-05, "loss": 0.4802, "step": 2525 }, { "epoch": 0.29, "learning_rate": 1.6691856218062105e-05, "loss": 0.4808, "step": 2526 }, { "epoch": 0.29, "learning_rate": 1.6689105078981333e-05, "loss": 0.4646, "step": 2527 }, { "epoch": 0.29, "learning_rate": 1.668635302334383e-05, "loss": 0.48, "step": 2528 }, { "epoch": 0.29, "learning_rate": 1.6683600051526682e-05, "loss": 0.4655, "step": 2529 }, { "epoch": 0.29, "learning_rate": 1.6680846163907107e-05, "loss": 0.4952, "step": 2530 }, { "epoch": 0.29, "learning_rate": 1.6678091360862447e-05, "loss": 0.4787, "step": 2531 }, { "epoch": 0.29, "learning_rate": 1.6675335642770178e-05, "loss": 0.4895, "step": 2532 }, { "epoch": 0.29, "learning_rate": 1.667257901000789e-05, "loss": 0.4627, "step": 2533 }, { "epoch": 0.29, "learning_rate": 1.6669821462953303e-05, "loss": 0.4718, "step": 2534 }, { "epoch": 0.29, "learning_rate": 1.6667063001984267e-05, "loss": 0.4801, "step": 2535 }, { "epoch": 0.29, "learning_rate": 1.6664303627478745e-05, "loss": 0.4728, "step": 2536 }, { "epoch": 0.29, "learning_rate": 1.6661543339814847e-05, "loss": 0.4682, "step": 2537 }, { "epoch": 0.29, "learning_rate": 1.6658782139370775e-05, "loss": 0.4591, "step": 2538 }, { "epoch": 0.29, "learning_rate": 1.6656020026524887e-05, "loss": 0.4752, "step": 2539 }, { "epoch": 0.29, "learning_rate": 1.6653257001655652e-05, "loss": 0.4631, "step": 2540 }, { "epoch": 0.29, "learning_rate": 1.6650493065141672e-05, "loss": 0.4763, "step": 2541 }, { "epoch": 0.29, "learning_rate": 1.6647728217361658e-05, "loss": 0.4713, "step": 2542 }, { "epoch": 0.29, "learning_rate": 1.6644962458694457e-05, "loss": 0.4599, "step": 2543 }, { "epoch": 0.29, "learning_rate": 1.6642195789519045e-05, "loss": 0.4702, "step": 2544 }, { "epoch": 0.29, "learning_rate": 1.6639428210214514e-05, "loss": 0.4738, "step": 2545 }, { "epoch": 0.29, "learning_rate": 1.6636659721160088e-05, "loss": 0.4827, "step": 2546 }, { "epoch": 0.29, "learning_rate": 1.6633890322735107e-05, "loss": 0.4857, "step": 2547 }, { "epoch": 0.29, "learning_rate": 1.6631120015319044e-05, "loss": 0.4765, "step": 2548 }, { "epoch": 0.29, "learning_rate": 1.662834879929149e-05, "loss": 0.4676, "step": 2549 }, { "epoch": 0.29, "learning_rate": 1.6625576675032163e-05, "loss": 0.4788, "step": 2550 }, { "epoch": 0.29, "learning_rate": 1.6622803642920912e-05, "loss": 0.4827, "step": 2551 }, { "epoch": 0.29, "learning_rate": 1.6620029703337697e-05, "loss": 0.469, "step": 2552 }, { "epoch": 0.29, "learning_rate": 1.6617254856662613e-05, "loss": 0.4874, "step": 2553 }, { "epoch": 0.29, "learning_rate": 1.6614479103275875e-05, "loss": 0.4735, "step": 2554 }, { "epoch": 0.29, "learning_rate": 1.6611702443557826e-05, "loss": 0.4696, "step": 2555 }, { "epoch": 0.29, "learning_rate": 1.6608924877888926e-05, "loss": 0.4801, "step": 2556 }, { "epoch": 0.29, "learning_rate": 1.6606146406649767e-05, "loss": 0.471, "step": 2557 }, { "epoch": 0.29, "learning_rate": 1.660336703022106e-05, "loss": 0.4862, "step": 2558 }, { "epoch": 0.29, "learning_rate": 1.6600586748983642e-05, "loss": 0.4797, "step": 2559 }, { "epoch": 0.29, "learning_rate": 1.6597805563318475e-05, "loss": 0.4754, "step": 2560 }, { "epoch": 0.29, "learning_rate": 1.659502347360664e-05, "loss": 0.4828, "step": 2561 }, { "epoch": 0.29, "learning_rate": 1.659224048022935e-05, "loss": 0.4729, "step": 2562 }, { "epoch": 0.29, "learning_rate": 1.6589456583567934e-05, "loss": 0.4708, "step": 2563 }, { "epoch": 0.29, "learning_rate": 1.6586671784003846e-05, "loss": 0.4831, "step": 2564 }, { "epoch": 0.29, "learning_rate": 1.658388608191867e-05, "loss": 0.4759, "step": 2565 }, { "epoch": 0.29, "learning_rate": 1.658109947769411e-05, "loss": 0.4712, "step": 2566 }, { "epoch": 0.29, "learning_rate": 1.657831197171199e-05, "loss": 0.4785, "step": 2567 }, { "epoch": 0.29, "learning_rate": 1.657552356435426e-05, "loss": 0.4917, "step": 2568 }, { "epoch": 0.29, "learning_rate": 1.6572734256002997e-05, "loss": 0.4723, "step": 2569 }, { "epoch": 0.29, "learning_rate": 1.6569944047040394e-05, "loss": 0.4645, "step": 2570 }, { "epoch": 0.29, "learning_rate": 1.6567152937848776e-05, "loss": 0.483, "step": 2571 }, { "epoch": 0.29, "learning_rate": 1.6564360928810588e-05, "loss": 0.4732, "step": 2572 }, { "epoch": 0.29, "learning_rate": 1.6561568020308397e-05, "loss": 0.48, "step": 2573 }, { "epoch": 0.29, "learning_rate": 1.6558774212724888e-05, "loss": 0.48, "step": 2574 }, { "epoch": 0.29, "learning_rate": 1.655597950644288e-05, "loss": 0.4795, "step": 2575 }, { "epoch": 0.29, "learning_rate": 1.6553183901845313e-05, "loss": 0.475, "step": 2576 }, { "epoch": 0.29, "learning_rate": 1.6550387399315246e-05, "loss": 0.4733, "step": 2577 }, { "epoch": 0.29, "learning_rate": 1.6547589999235854e-05, "loss": 0.4748, "step": 2578 }, { "epoch": 0.29, "learning_rate": 1.654479170199045e-05, "loss": 0.467, "step": 2579 }, { "epoch": 0.29, "learning_rate": 1.6541992507962467e-05, "loss": 0.4737, "step": 2580 }, { "epoch": 0.29, "learning_rate": 1.653919241753545e-05, "loss": 0.4803, "step": 2581 }, { "epoch": 0.3, "learning_rate": 1.6536391431093077e-05, "loss": 0.4576, "step": 2582 }, { "epoch": 0.3, "learning_rate": 1.6533589549019147e-05, "loss": 0.4855, "step": 2583 }, { "epoch": 0.3, "learning_rate": 1.6530786771697575e-05, "loss": 0.4809, "step": 2584 }, { "epoch": 0.3, "learning_rate": 1.6527983099512414e-05, "loss": 0.4582, "step": 2585 }, { "epoch": 0.3, "learning_rate": 1.6525178532847816e-05, "loss": 0.4754, "step": 2586 }, { "epoch": 0.3, "learning_rate": 1.6522373072088083e-05, "loss": 0.4623, "step": 2587 }, { "epoch": 0.3, "learning_rate": 1.6519566717617616e-05, "loss": 0.4678, "step": 2588 }, { "epoch": 0.3, "learning_rate": 1.6516759469820955e-05, "loss": 0.4837, "step": 2589 }, { "epoch": 0.3, "learning_rate": 1.6513951329082746e-05, "loss": 0.4858, "step": 2590 }, { "epoch": 0.3, "learning_rate": 1.651114229578778e-05, "loss": 0.4732, "step": 2591 }, { "epoch": 0.3, "learning_rate": 1.6508332370320948e-05, "loss": 0.4903, "step": 2592 }, { "epoch": 0.3, "learning_rate": 1.6505521553067273e-05, "loss": 0.4576, "step": 2593 }, { "epoch": 0.3, "learning_rate": 1.6502709844411907e-05, "loss": 0.4749, "step": 2594 }, { "epoch": 0.3, "learning_rate": 1.6499897244740107e-05, "loss": 0.4708, "step": 2595 }, { "epoch": 0.3, "learning_rate": 1.649708375443727e-05, "loss": 0.4769, "step": 2596 }, { "epoch": 0.3, "learning_rate": 1.6494269373888902e-05, "loss": 0.4642, "step": 2597 }, { "epoch": 0.3, "learning_rate": 1.6491454103480637e-05, "loss": 0.4851, "step": 2598 }, { "epoch": 0.3, "learning_rate": 1.6488637943598235e-05, "loss": 0.4549, "step": 2599 }, { "epoch": 0.3, "learning_rate": 1.648582089462756e-05, "loss": 0.5042, "step": 2600 }, { "epoch": 0.3, "learning_rate": 1.6483002956954622e-05, "loss": 0.4748, "step": 2601 }, { "epoch": 0.3, "learning_rate": 1.6480184130965542e-05, "loss": 0.4497, "step": 2602 }, { "epoch": 0.3, "learning_rate": 1.647736441704656e-05, "loss": 0.4645, "step": 2603 }, { "epoch": 0.3, "learning_rate": 1.647454381558403e-05, "loss": 0.4807, "step": 2604 }, { "epoch": 0.3, "learning_rate": 1.647172232696445e-05, "loss": 0.4787, "step": 2605 }, { "epoch": 0.3, "learning_rate": 1.6468899951574423e-05, "loss": 0.4748, "step": 2606 }, { "epoch": 0.3, "learning_rate": 1.6466076689800677e-05, "loss": 0.4747, "step": 2607 }, { "epoch": 0.3, "learning_rate": 1.6463252542030058e-05, "loss": 0.4748, "step": 2608 }, { "epoch": 0.3, "learning_rate": 1.6460427508649546e-05, "loss": 0.4958, "step": 2609 }, { "epoch": 0.3, "learning_rate": 1.6457601590046227e-05, "loss": 0.454, "step": 2610 }, { "epoch": 0.3, "learning_rate": 1.6454774786607317e-05, "loss": 0.4737, "step": 2611 }, { "epoch": 0.3, "learning_rate": 1.6451947098720148e-05, "loss": 0.4823, "step": 2612 }, { "epoch": 0.3, "learning_rate": 1.6449118526772183e-05, "loss": 0.4601, "step": 2613 }, { "epoch": 0.3, "learning_rate": 1.6446289071150993e-05, "loss": 0.4766, "step": 2614 }, { "epoch": 0.3, "learning_rate": 1.644345873224428e-05, "loss": 0.4621, "step": 2615 }, { "epoch": 0.3, "learning_rate": 1.6440627510439862e-05, "loss": 0.4784, "step": 2616 }, { "epoch": 0.3, "learning_rate": 1.6437795406125684e-05, "loss": 0.4711, "step": 2617 }, { "epoch": 0.3, "learning_rate": 1.6434962419689803e-05, "loss": 0.4825, "step": 2618 }, { "epoch": 0.3, "learning_rate": 1.64321285515204e-05, "loss": 0.4636, "step": 2619 }, { "epoch": 0.3, "learning_rate": 1.6429293802005783e-05, "loss": 0.4749, "step": 2620 }, { "epoch": 0.3, "learning_rate": 1.642645817153437e-05, "loss": 0.4664, "step": 2621 }, { "epoch": 0.3, "learning_rate": 1.6423621660494714e-05, "loss": 0.4854, "step": 2622 }, { "epoch": 0.3, "learning_rate": 1.6420784269275474e-05, "loss": 0.4695, "step": 2623 }, { "epoch": 0.3, "learning_rate": 1.6417945998265436e-05, "loss": 0.4813, "step": 2624 }, { "epoch": 0.3, "learning_rate": 1.641510684785351e-05, "loss": 0.464, "step": 2625 }, { "epoch": 0.3, "learning_rate": 1.641226681842872e-05, "loss": 0.4837, "step": 2626 }, { "epoch": 0.3, "learning_rate": 1.6409425910380215e-05, "loss": 0.4592, "step": 2627 }, { "epoch": 0.3, "learning_rate": 1.640658412409726e-05, "loss": 0.4575, "step": 2628 }, { "epoch": 0.3, "learning_rate": 1.640374145996925e-05, "loss": 0.4661, "step": 2629 }, { "epoch": 0.3, "learning_rate": 1.6400897918385687e-05, "loss": 0.501, "step": 2630 }, { "epoch": 0.3, "learning_rate": 1.63980534997362e-05, "loss": 0.4592, "step": 2631 }, { "epoch": 0.3, "learning_rate": 1.639520820441054e-05, "loss": 0.4907, "step": 2632 }, { "epoch": 0.3, "learning_rate": 1.6392362032798578e-05, "loss": 0.4751, "step": 2633 }, { "epoch": 0.3, "learning_rate": 1.63895149852903e-05, "loss": 0.4735, "step": 2634 }, { "epoch": 0.3, "learning_rate": 1.6386667062275817e-05, "loss": 0.4791, "step": 2635 }, { "epoch": 0.3, "learning_rate": 1.638381826414535e-05, "loss": 0.476, "step": 2636 }, { "epoch": 0.3, "learning_rate": 1.638096859128926e-05, "loss": 0.453, "step": 2637 }, { "epoch": 0.3, "learning_rate": 1.637811804409801e-05, "loss": 0.4987, "step": 2638 }, { "epoch": 0.3, "learning_rate": 1.6375266622962188e-05, "loss": 0.4523, "step": 2639 }, { "epoch": 0.3, "learning_rate": 1.6372414328272502e-05, "loss": 0.4917, "step": 2640 }, { "epoch": 0.3, "learning_rate": 1.6369561160419783e-05, "loss": 0.4654, "step": 2641 }, { "epoch": 0.3, "learning_rate": 1.6366707119794978e-05, "loss": 0.4869, "step": 2642 }, { "epoch": 0.3, "learning_rate": 1.6363852206789155e-05, "loss": 0.4597, "step": 2643 }, { "epoch": 0.3, "learning_rate": 1.6360996421793497e-05, "loss": 0.4904, "step": 2644 }, { "epoch": 0.3, "learning_rate": 1.635813976519931e-05, "loss": 0.4572, "step": 2645 }, { "epoch": 0.3, "learning_rate": 1.6355282237398026e-05, "loss": 0.4793, "step": 2646 }, { "epoch": 0.3, "learning_rate": 1.6352423838781185e-05, "loss": 0.4746, "step": 2647 }, { "epoch": 0.3, "learning_rate": 1.6349564569740454e-05, "loss": 0.4728, "step": 2648 }, { "epoch": 0.3, "learning_rate": 1.6346704430667612e-05, "loss": 0.477, "step": 2649 }, { "epoch": 0.3, "learning_rate": 1.6343843421954567e-05, "loss": 0.4799, "step": 2650 }, { "epoch": 0.3, "learning_rate": 1.634098154399334e-05, "loss": 0.4626, "step": 2651 }, { "epoch": 0.3, "learning_rate": 1.6338118797176074e-05, "loss": 0.4803, "step": 2652 }, { "epoch": 0.3, "learning_rate": 1.6335255181895026e-05, "loss": 0.482, "step": 2653 }, { "epoch": 0.3, "learning_rate": 1.633239069854257e-05, "loss": 0.4549, "step": 2654 }, { "epoch": 0.3, "learning_rate": 1.632952534751122e-05, "loss": 0.4724, "step": 2655 }, { "epoch": 0.3, "learning_rate": 1.6326659129193577e-05, "loss": 0.4907, "step": 2656 }, { "epoch": 0.3, "learning_rate": 1.632379204398238e-05, "loss": 0.4783, "step": 2657 }, { "epoch": 0.3, "learning_rate": 1.6320924092270494e-05, "loss": 0.5081, "step": 2658 }, { "epoch": 0.3, "learning_rate": 1.6318055274450885e-05, "loss": 0.4605, "step": 2659 }, { "epoch": 0.3, "learning_rate": 1.6315185590916644e-05, "loss": 0.4626, "step": 2660 }, { "epoch": 0.3, "learning_rate": 1.6312315042060984e-05, "loss": 0.4659, "step": 2661 }, { "epoch": 0.3, "learning_rate": 1.630944362827723e-05, "loss": 0.4902, "step": 2662 }, { "epoch": 0.3, "learning_rate": 1.6306571349958833e-05, "loss": 0.4671, "step": 2663 }, { "epoch": 0.3, "learning_rate": 1.6303698207499364e-05, "loss": 0.4744, "step": 2664 }, { "epoch": 0.3, "learning_rate": 1.63008242012925e-05, "loss": 0.4611, "step": 2665 }, { "epoch": 0.3, "learning_rate": 1.6297949331732047e-05, "loss": 0.5038, "step": 2666 }, { "epoch": 0.3, "learning_rate": 1.629507359921193e-05, "loss": 0.4835, "step": 2667 }, { "epoch": 0.3, "learning_rate": 1.6292197004126184e-05, "loss": 0.4742, "step": 2668 }, { "epoch": 0.31, "learning_rate": 1.6289319546868966e-05, "loss": 0.4685, "step": 2669 }, { "epoch": 0.31, "learning_rate": 1.6286441227834552e-05, "loss": 0.4954, "step": 2670 }, { "epoch": 0.31, "learning_rate": 1.6283562047417342e-05, "loss": 0.4682, "step": 2671 }, { "epoch": 0.31, "learning_rate": 1.628068200601184e-05, "loss": 0.4653, "step": 2672 }, { "epoch": 0.31, "learning_rate": 1.627780110401268e-05, "loss": 0.4799, "step": 2673 }, { "epoch": 0.31, "learning_rate": 1.6274919341814607e-05, "loss": 0.4749, "step": 2674 }, { "epoch": 0.31, "learning_rate": 1.6272036719812496e-05, "loss": 0.4631, "step": 2675 }, { "epoch": 0.31, "learning_rate": 1.6269153238401317e-05, "loss": 0.4921, "step": 2676 }, { "epoch": 0.31, "learning_rate": 1.626626889797618e-05, "loss": 0.4678, "step": 2677 }, { "epoch": 0.31, "learning_rate": 1.6263383698932307e-05, "loss": 0.4558, "step": 2678 }, { "epoch": 0.31, "learning_rate": 1.6260497641665028e-05, "loss": 0.4778, "step": 2679 }, { "epoch": 0.31, "learning_rate": 1.6257610726569798e-05, "loss": 0.4876, "step": 2680 }, { "epoch": 0.31, "learning_rate": 1.625472295404219e-05, "loss": 0.4687, "step": 2681 }, { "epoch": 0.31, "learning_rate": 1.625183432447789e-05, "loss": 0.4772, "step": 2682 }, { "epoch": 0.31, "learning_rate": 1.6248944838272712e-05, "loss": 0.46, "step": 2683 }, { "epoch": 0.31, "learning_rate": 1.6246054495822575e-05, "loss": 0.4925, "step": 2684 }, { "epoch": 0.31, "learning_rate": 1.6243163297523524e-05, "loss": 0.4656, "step": 2685 }, { "epoch": 0.31, "learning_rate": 1.6240271243771713e-05, "loss": 0.4525, "step": 2686 }, { "epoch": 0.31, "learning_rate": 1.6237378334963422e-05, "loss": 0.4818, "step": 2687 }, { "epoch": 0.31, "learning_rate": 1.623448457149504e-05, "loss": 0.4646, "step": 2688 }, { "epoch": 0.31, "learning_rate": 1.623158995376308e-05, "loss": 0.4739, "step": 2689 }, { "epoch": 0.31, "learning_rate": 1.6228694482164167e-05, "loss": 0.4613, "step": 2690 }, { "epoch": 0.31, "learning_rate": 1.622579815709505e-05, "loss": 0.5051, "step": 2691 }, { "epoch": 0.31, "learning_rate": 1.6222900978952586e-05, "loss": 0.4472, "step": 2692 }, { "epoch": 0.31, "learning_rate": 1.6220002948133756e-05, "loss": 0.5041, "step": 2693 }, { "epoch": 0.31, "learning_rate": 1.6217104065035652e-05, "loss": 0.4845, "step": 2694 }, { "epoch": 0.31, "learning_rate": 1.6214204330055484e-05, "loss": 0.4754, "step": 2695 }, { "epoch": 0.31, "learning_rate": 1.621130374359059e-05, "loss": 0.4589, "step": 2696 }, { "epoch": 0.31, "learning_rate": 1.6208402306038406e-05, "loss": 0.4649, "step": 2697 }, { "epoch": 0.31, "learning_rate": 1.620550001779649e-05, "loss": 0.4751, "step": 2698 }, { "epoch": 0.31, "learning_rate": 1.6202596879262536e-05, "loss": 0.4805, "step": 2699 }, { "epoch": 0.31, "learning_rate": 1.6199692890834324e-05, "loss": 0.46, "step": 2700 }, { "epoch": 0.31, "learning_rate": 1.6196788052909772e-05, "loss": 0.477, "step": 2701 }, { "epoch": 0.31, "learning_rate": 1.6193882365886905e-05, "loss": 0.4757, "step": 2702 }, { "epoch": 0.31, "learning_rate": 1.6190975830163872e-05, "loss": 0.4712, "step": 2703 }, { "epoch": 0.31, "learning_rate": 1.6188068446138925e-05, "loss": 0.4701, "step": 2704 }, { "epoch": 0.31, "learning_rate": 1.6185160214210447e-05, "loss": 0.4706, "step": 2705 }, { "epoch": 0.31, "learning_rate": 1.6182251134776927e-05, "loss": 0.4659, "step": 2706 }, { "epoch": 0.31, "learning_rate": 1.6179341208236977e-05, "loss": 0.4882, "step": 2707 }, { "epoch": 0.31, "learning_rate": 1.617643043498932e-05, "loss": 0.4824, "step": 2708 }, { "epoch": 0.31, "learning_rate": 1.6173518815432797e-05, "loss": 0.4679, "step": 2709 }, { "epoch": 0.31, "learning_rate": 1.6170606349966367e-05, "loss": 0.4932, "step": 2710 }, { "epoch": 0.31, "learning_rate": 1.6167693038989098e-05, "loss": 0.485, "step": 2711 }, { "epoch": 0.31, "learning_rate": 1.6164778882900186e-05, "loss": 0.4555, "step": 2712 }, { "epoch": 0.31, "learning_rate": 1.6161863882098926e-05, "loss": 0.5035, "step": 2713 }, { "epoch": 0.31, "learning_rate": 1.615894803698475e-05, "loss": 0.4557, "step": 2714 }, { "epoch": 0.31, "learning_rate": 1.615603134795718e-05, "loss": 0.4986, "step": 2715 }, { "epoch": 0.31, "learning_rate": 1.615311381541588e-05, "loss": 0.4746, "step": 2716 }, { "epoch": 0.31, "learning_rate": 1.615019543976061e-05, "loss": 0.4601, "step": 2717 }, { "epoch": 0.31, "learning_rate": 1.6147276221391256e-05, "loss": 0.4762, "step": 2718 }, { "epoch": 0.31, "learning_rate": 1.614435616070781e-05, "loss": 0.483, "step": 2719 }, { "epoch": 0.31, "learning_rate": 1.6141435258110397e-05, "loss": 0.4747, "step": 2720 }, { "epoch": 0.31, "learning_rate": 1.6138513513999234e-05, "loss": 0.4668, "step": 2721 }, { "epoch": 0.31, "learning_rate": 1.613559092877467e-05, "loss": 0.4704, "step": 2722 }, { "epoch": 0.31, "learning_rate": 1.6132667502837164e-05, "loss": 0.4809, "step": 2723 }, { "epoch": 0.31, "learning_rate": 1.6129743236587293e-05, "loss": 0.4661, "step": 2724 }, { "epoch": 0.31, "learning_rate": 1.6126818130425746e-05, "loss": 0.48, "step": 2725 }, { "epoch": 0.31, "learning_rate": 1.6123892184753324e-05, "loss": 0.4916, "step": 2726 }, { "epoch": 0.31, "learning_rate": 1.612096539997095e-05, "loss": 0.4791, "step": 2727 }, { "epoch": 0.31, "learning_rate": 1.611803777647966e-05, "loss": 0.4851, "step": 2728 }, { "epoch": 0.31, "learning_rate": 1.6115109314680603e-05, "loss": 0.4755, "step": 2729 }, { "epoch": 0.31, "learning_rate": 1.611218001497504e-05, "loss": 0.4662, "step": 2730 }, { "epoch": 0.31, "learning_rate": 1.610924987776436e-05, "loss": 0.4743, "step": 2731 }, { "epoch": 0.31, "learning_rate": 1.6106318903450042e-05, "loss": 0.446, "step": 2732 }, { "epoch": 0.31, "learning_rate": 1.6103387092433704e-05, "loss": 0.48, "step": 2733 }, { "epoch": 0.31, "learning_rate": 1.6100454445117074e-05, "loss": 0.4846, "step": 2734 }, { "epoch": 0.31, "learning_rate": 1.6097520961901983e-05, "loss": 0.4946, "step": 2735 }, { "epoch": 0.31, "learning_rate": 1.6094586643190388e-05, "loss": 0.4798, "step": 2736 }, { "epoch": 0.31, "learning_rate": 1.609165148938435e-05, "loss": 0.4737, "step": 2737 }, { "epoch": 0.31, "learning_rate": 1.608871550088606e-05, "loss": 0.4634, "step": 2738 }, { "epoch": 0.31, "learning_rate": 1.6085778678097804e-05, "loss": 0.4716, "step": 2739 }, { "epoch": 0.31, "learning_rate": 1.6082841021422e-05, "loss": 0.4621, "step": 2740 }, { "epoch": 0.31, "learning_rate": 1.607990253126117e-05, "loss": 0.4844, "step": 2741 }, { "epoch": 0.31, "learning_rate": 1.607696320801795e-05, "loss": 0.479, "step": 2742 }, { "epoch": 0.31, "learning_rate": 1.6074023052095096e-05, "loss": 0.4718, "step": 2743 }, { "epoch": 0.31, "learning_rate": 1.6071082063895476e-05, "loss": 0.4843, "step": 2744 }, { "epoch": 0.31, "learning_rate": 1.6068140243822065e-05, "loss": 0.4677, "step": 2745 }, { "epoch": 0.31, "learning_rate": 1.6065197592277965e-05, "loss": 0.4666, "step": 2746 }, { "epoch": 0.31, "learning_rate": 1.6062254109666383e-05, "loss": 0.4853, "step": 2747 }, { "epoch": 0.31, "learning_rate": 1.6059309796390638e-05, "loss": 0.4735, "step": 2748 }, { "epoch": 0.31, "learning_rate": 1.6056364652854174e-05, "loss": 0.4768, "step": 2749 }, { "epoch": 0.31, "learning_rate": 1.6053418679460534e-05, "loss": 0.4528, "step": 2750 }, { "epoch": 0.31, "learning_rate": 1.6050471876613386e-05, "loss": 0.4702, "step": 2751 }, { "epoch": 0.31, "learning_rate": 1.6047524244716506e-05, "loss": 0.4713, "step": 2752 }, { "epoch": 0.31, "learning_rate": 1.604457578417379e-05, "loss": 0.4758, "step": 2753 }, { "epoch": 0.31, "learning_rate": 1.6041626495389235e-05, "loss": 0.4742, "step": 2754 }, { "epoch": 0.31, "learning_rate": 1.6038676378766968e-05, "loss": 0.4639, "step": 2755 }, { "epoch": 0.31, "learning_rate": 1.603572543471121e-05, "loss": 0.4743, "step": 2756 }, { "epoch": 0.32, "learning_rate": 1.603277366362632e-05, "loss": 0.4833, "step": 2757 }, { "epoch": 0.32, "learning_rate": 1.6029821065916745e-05, "loss": 0.4669, "step": 2758 }, { "epoch": 0.32, "learning_rate": 1.602686764198706e-05, "loss": 0.4883, "step": 2759 }, { "epoch": 0.32, "learning_rate": 1.602391339224196e-05, "loss": 0.4739, "step": 2760 }, { "epoch": 0.32, "learning_rate": 1.6020958317086224e-05, "loss": 0.466, "step": 2761 }, { "epoch": 0.32, "learning_rate": 1.601800241692478e-05, "loss": 0.4624, "step": 2762 }, { "epoch": 0.32, "learning_rate": 1.6015045692162644e-05, "loss": 0.4698, "step": 2763 }, { "epoch": 0.32, "learning_rate": 1.6012088143204953e-05, "loss": 0.4567, "step": 2764 }, { "epoch": 0.32, "learning_rate": 1.6009129770456962e-05, "loss": 0.4719, "step": 2765 }, { "epoch": 0.32, "learning_rate": 1.6006170574324033e-05, "loss": 0.4681, "step": 2766 }, { "epoch": 0.32, "learning_rate": 1.6003210555211635e-05, "loss": 0.4753, "step": 2767 }, { "epoch": 0.32, "learning_rate": 1.6000249713525366e-05, "loss": 0.4674, "step": 2768 }, { "epoch": 0.32, "learning_rate": 1.5997288049670924e-05, "loss": 0.4563, "step": 2769 }, { "epoch": 0.32, "learning_rate": 1.5994325564054122e-05, "loss": 0.5064, "step": 2770 }, { "epoch": 0.32, "learning_rate": 1.599136225708089e-05, "loss": 0.4761, "step": 2771 }, { "epoch": 0.32, "learning_rate": 1.598839812915726e-05, "loss": 0.4571, "step": 2772 }, { "epoch": 0.32, "learning_rate": 1.598543318068939e-05, "loss": 0.4861, "step": 2773 }, { "epoch": 0.32, "learning_rate": 1.5982467412083543e-05, "loss": 0.4579, "step": 2774 }, { "epoch": 0.32, "learning_rate": 1.5979500823746096e-05, "loss": 0.4937, "step": 2775 }, { "epoch": 0.32, "learning_rate": 1.5976533416083535e-05, "loss": 0.4646, "step": 2776 }, { "epoch": 0.32, "learning_rate": 1.5973565189502463e-05, "loss": 0.4636, "step": 2777 }, { "epoch": 0.32, "learning_rate": 1.5970596144409595e-05, "loss": 0.4741, "step": 2778 }, { "epoch": 0.32, "learning_rate": 1.5967626281211754e-05, "loss": 0.4716, "step": 2779 }, { "epoch": 0.32, "learning_rate": 1.596465560031588e-05, "loss": 0.4568, "step": 2780 }, { "epoch": 0.32, "learning_rate": 1.5961684102129015e-05, "loss": 0.4772, "step": 2781 }, { "epoch": 0.32, "learning_rate": 1.5958711787058332e-05, "loss": 0.4642, "step": 2782 }, { "epoch": 0.32, "learning_rate": 1.5955738655511094e-05, "loss": 0.4938, "step": 2783 }, { "epoch": 0.32, "learning_rate": 1.5952764707894696e-05, "loss": 0.4634, "step": 2784 }, { "epoch": 0.32, "learning_rate": 1.594978994461663e-05, "loss": 0.4767, "step": 2785 }, { "epoch": 0.32, "learning_rate": 1.5946814366084505e-05, "loss": 0.4734, "step": 2786 }, { "epoch": 0.32, "learning_rate": 1.594383797270604e-05, "loss": 0.4918, "step": 2787 }, { "epoch": 0.32, "learning_rate": 1.5940860764889073e-05, "loss": 0.4859, "step": 2788 }, { "epoch": 0.32, "learning_rate": 1.5937882743041543e-05, "loss": 0.462, "step": 2789 }, { "epoch": 0.32, "learning_rate": 1.5934903907571507e-05, "loss": 0.4686, "step": 2790 }, { "epoch": 0.32, "learning_rate": 1.593192425888713e-05, "loss": 0.4752, "step": 2791 }, { "epoch": 0.32, "learning_rate": 1.5928943797396695e-05, "loss": 0.4988, "step": 2792 }, { "epoch": 0.32, "learning_rate": 1.592596252350859e-05, "loss": 0.4771, "step": 2793 }, { "epoch": 0.32, "learning_rate": 1.5922980437631314e-05, "loss": 0.4763, "step": 2794 }, { "epoch": 0.32, "learning_rate": 1.591999754017348e-05, "loss": 0.4701, "step": 2795 }, { "epoch": 0.32, "learning_rate": 1.5917013831543814e-05, "loss": 0.4927, "step": 2796 }, { "epoch": 0.32, "learning_rate": 1.5914029312151146e-05, "loss": 0.4832, "step": 2797 }, { "epoch": 0.32, "learning_rate": 1.5911043982404426e-05, "loss": 0.475, "step": 2798 }, { "epoch": 0.32, "learning_rate": 1.590805784271271e-05, "loss": 0.4782, "step": 2799 }, { "epoch": 0.32, "learning_rate": 1.5905070893485165e-05, "loss": 0.4783, "step": 2800 }, { "epoch": 0.32, "learning_rate": 1.5902083135131067e-05, "loss": 0.514, "step": 2801 }, { "epoch": 0.32, "learning_rate": 1.5899094568059812e-05, "loss": 0.4526, "step": 2802 }, { "epoch": 0.32, "learning_rate": 1.58961051926809e-05, "loss": 0.4837, "step": 2803 }, { "epoch": 0.32, "learning_rate": 1.5893115009403932e-05, "loss": 0.4742, "step": 2804 }, { "epoch": 0.32, "learning_rate": 1.589012401863864e-05, "loss": 0.4731, "step": 2805 }, { "epoch": 0.32, "learning_rate": 1.5887132220794855e-05, "loss": 0.4697, "step": 2806 }, { "epoch": 0.32, "learning_rate": 1.5884139616282517e-05, "loss": 0.4692, "step": 2807 }, { "epoch": 0.32, "learning_rate": 1.5881146205511683e-05, "loss": 0.4793, "step": 2808 }, { "epoch": 0.32, "learning_rate": 1.5878151988892513e-05, "loss": 0.4826, "step": 2809 }, { "epoch": 0.32, "learning_rate": 1.5875156966835285e-05, "loss": 0.4683, "step": 2810 }, { "epoch": 0.32, "learning_rate": 1.5872161139750384e-05, "loss": 0.4728, "step": 2811 }, { "epoch": 0.32, "learning_rate": 1.5869164508048304e-05, "loss": 0.4519, "step": 2812 }, { "epoch": 0.32, "learning_rate": 1.5866167072139645e-05, "loss": 0.4566, "step": 2813 }, { "epoch": 0.32, "learning_rate": 1.5863168832435137e-05, "loss": 0.4898, "step": 2814 }, { "epoch": 0.32, "learning_rate": 1.5860169789345592e-05, "loss": 0.472, "step": 2815 }, { "epoch": 0.32, "learning_rate": 1.5857169943281948e-05, "loss": 0.4816, "step": 2816 }, { "epoch": 0.32, "learning_rate": 1.585416929465526e-05, "loss": 0.4718, "step": 2817 }, { "epoch": 0.32, "learning_rate": 1.585116784387667e-05, "loss": 0.4443, "step": 2818 }, { "epoch": 0.32, "learning_rate": 1.5848165591357458e-05, "loss": 0.4654, "step": 2819 }, { "epoch": 0.32, "learning_rate": 1.584516253750899e-05, "loss": 0.4793, "step": 2820 }, { "epoch": 0.32, "learning_rate": 1.5842158682742756e-05, "loss": 0.4703, "step": 2821 }, { "epoch": 0.32, "learning_rate": 1.5839154027470346e-05, "loss": 0.4631, "step": 2822 }, { "epoch": 0.32, "learning_rate": 1.583614857210347e-05, "loss": 0.4858, "step": 2823 }, { "epoch": 0.32, "learning_rate": 1.5833142317053943e-05, "loss": 0.4655, "step": 2824 }, { "epoch": 0.32, "learning_rate": 1.5830135262733684e-05, "loss": 0.4708, "step": 2825 }, { "epoch": 0.32, "learning_rate": 1.582712740955473e-05, "loss": 0.477, "step": 2826 }, { "epoch": 0.32, "learning_rate": 1.5824118757929224e-05, "loss": 0.4869, "step": 2827 }, { "epoch": 0.32, "learning_rate": 1.5821109308269416e-05, "loss": 0.4708, "step": 2828 }, { "epoch": 0.32, "learning_rate": 1.581809906098767e-05, "loss": 0.4834, "step": 2829 }, { "epoch": 0.32, "learning_rate": 1.581508801649646e-05, "loss": 0.4669, "step": 2830 }, { "epoch": 0.32, "learning_rate": 1.581207617520836e-05, "loss": 0.4761, "step": 2831 }, { "epoch": 0.32, "learning_rate": 1.5809063537536066e-05, "loss": 0.4765, "step": 2832 }, { "epoch": 0.32, "learning_rate": 1.580605010389237e-05, "loss": 0.4775, "step": 2833 }, { "epoch": 0.32, "learning_rate": 1.5803035874690186e-05, "loss": 0.4697, "step": 2834 }, { "epoch": 0.32, "learning_rate": 1.5800020850342524e-05, "loss": 0.4574, "step": 2835 }, { "epoch": 0.32, "learning_rate": 1.5797005031262514e-05, "loss": 0.4732, "step": 2836 }, { "epoch": 0.32, "learning_rate": 1.579398841786339e-05, "loss": 0.492, "step": 2837 }, { "epoch": 0.32, "learning_rate": 1.57909710105585e-05, "loss": 0.4496, "step": 2838 }, { "epoch": 0.32, "learning_rate": 1.5787952809761286e-05, "loss": 0.478, "step": 2839 }, { "epoch": 0.32, "learning_rate": 1.5784933815885315e-05, "loss": 0.4775, "step": 2840 }, { "epoch": 0.32, "learning_rate": 1.5781914029344254e-05, "loss": 0.4648, "step": 2841 }, { "epoch": 0.32, "learning_rate": 1.5778893450551888e-05, "loss": 0.4642, "step": 2842 }, { "epoch": 0.32, "learning_rate": 1.5775872079922098e-05, "loss": 0.4863, "step": 2843 }, { "epoch": 0.33, "learning_rate": 1.5772849917868876e-05, "loss": 0.4598, "step": 2844 }, { "epoch": 0.33, "learning_rate": 1.576982696480633e-05, "loss": 0.478, "step": 2845 }, { "epoch": 0.33, "learning_rate": 1.5766803221148676e-05, "loss": 0.4735, "step": 2846 }, { "epoch": 0.33, "learning_rate": 1.5763778687310224e-05, "loss": 0.4723, "step": 2847 }, { "epoch": 0.33, "learning_rate": 1.5760753363705412e-05, "loss": 0.4484, "step": 2848 }, { "epoch": 0.33, "learning_rate": 1.5757727250748773e-05, "loss": 0.4742, "step": 2849 }, { "epoch": 0.33, "learning_rate": 1.5754700348854955e-05, "loss": 0.4912, "step": 2850 }, { "epoch": 0.33, "learning_rate": 1.5751672658438707e-05, "loss": 0.4788, "step": 2851 }, { "epoch": 0.33, "learning_rate": 1.574864417991489e-05, "loss": 0.4717, "step": 2852 }, { "epoch": 0.33, "learning_rate": 1.5745614913698478e-05, "loss": 0.5, "step": 2853 }, { "epoch": 0.33, "learning_rate": 1.5742584860204547e-05, "loss": 0.4665, "step": 2854 }, { "epoch": 0.33, "learning_rate": 1.5739554019848274e-05, "loss": 0.471, "step": 2855 }, { "epoch": 0.33, "learning_rate": 1.5736522393044962e-05, "loss": 0.4684, "step": 2856 }, { "epoch": 0.33, "learning_rate": 1.5733489980210007e-05, "loss": 0.4837, "step": 2857 }, { "epoch": 0.33, "learning_rate": 1.573045678175892e-05, "loss": 0.4908, "step": 2858 }, { "epoch": 0.33, "learning_rate": 1.5727422798107313e-05, "loss": 0.4824, "step": 2859 }, { "epoch": 0.33, "learning_rate": 1.5724388029670912e-05, "loss": 0.4636, "step": 2860 }, { "epoch": 0.33, "learning_rate": 1.5721352476865546e-05, "loss": 0.4617, "step": 2861 }, { "epoch": 0.33, "learning_rate": 1.5718316140107156e-05, "loss": 0.4884, "step": 2862 }, { "epoch": 0.33, "learning_rate": 1.5715279019811783e-05, "loss": 0.4766, "step": 2863 }, { "epoch": 0.33, "learning_rate": 1.571224111639559e-05, "loss": 0.4708, "step": 2864 }, { "epoch": 0.33, "learning_rate": 1.570920243027483e-05, "loss": 0.4695, "step": 2865 }, { "epoch": 0.33, "learning_rate": 1.5706162961865866e-05, "loss": 0.4738, "step": 2866 }, { "epoch": 0.33, "learning_rate": 1.570312271158519e-05, "loss": 0.4878, "step": 2867 }, { "epoch": 0.33, "learning_rate": 1.5700081679849362e-05, "loss": 0.4698, "step": 2868 }, { "epoch": 0.33, "learning_rate": 1.569703986707509e-05, "loss": 0.4732, "step": 2869 }, { "epoch": 0.33, "learning_rate": 1.5693997273679165e-05, "loss": 0.5003, "step": 2870 }, { "epoch": 0.33, "learning_rate": 1.5690953900078485e-05, "loss": 0.4552, "step": 2871 }, { "epoch": 0.33, "learning_rate": 1.5687909746690064e-05, "loss": 0.472, "step": 2872 }, { "epoch": 0.33, "learning_rate": 1.568486481393102e-05, "loss": 0.4709, "step": 2873 }, { "epoch": 0.33, "learning_rate": 1.5681819102218572e-05, "loss": 0.4626, "step": 2874 }, { "epoch": 0.33, "learning_rate": 1.5678772611970056e-05, "loss": 0.4704, "step": 2875 }, { "epoch": 0.33, "learning_rate": 1.5675725343602904e-05, "loss": 0.4631, "step": 2876 }, { "epoch": 0.33, "learning_rate": 1.5672677297534665e-05, "loss": 0.4735, "step": 2877 }, { "epoch": 0.33, "learning_rate": 1.566962847418299e-05, "loss": 0.4643, "step": 2878 }, { "epoch": 0.33, "learning_rate": 1.5666578873965627e-05, "loss": 0.4823, "step": 2879 }, { "epoch": 0.33, "learning_rate": 1.566352849730045e-05, "loss": 0.4623, "step": 2880 }, { "epoch": 0.33, "learning_rate": 1.566047734460542e-05, "loss": 0.4846, "step": 2881 }, { "epoch": 0.33, "learning_rate": 1.5657425416298623e-05, "loss": 0.4666, "step": 2882 }, { "epoch": 0.33, "learning_rate": 1.565437271279823e-05, "loss": 0.4601, "step": 2883 }, { "epoch": 0.33, "learning_rate": 1.5651319234522538e-05, "loss": 0.4834, "step": 2884 }, { "epoch": 0.33, "learning_rate": 1.5648264981889936e-05, "loss": 0.4699, "step": 2885 }, { "epoch": 0.33, "learning_rate": 1.564520995531893e-05, "loss": 0.4772, "step": 2886 }, { "epoch": 0.33, "learning_rate": 1.5642154155228124e-05, "loss": 0.4867, "step": 2887 }, { "epoch": 0.33, "learning_rate": 1.5639097582036226e-05, "loss": 0.4585, "step": 2888 }, { "epoch": 0.33, "learning_rate": 1.5636040236162066e-05, "loss": 0.4807, "step": 2889 }, { "epoch": 0.33, "learning_rate": 1.5632982118024556e-05, "loss": 0.4746, "step": 2890 }, { "epoch": 0.33, "learning_rate": 1.562992322804274e-05, "loss": 0.4685, "step": 2891 }, { "epoch": 0.33, "learning_rate": 1.5626863566635744e-05, "loss": 0.4727, "step": 2892 }, { "epoch": 0.33, "learning_rate": 1.5623803134222812e-05, "loss": 0.4873, "step": 2893 }, { "epoch": 0.33, "learning_rate": 1.5620741931223292e-05, "loss": 0.4863, "step": 2894 }, { "epoch": 0.33, "learning_rate": 1.5617679958056643e-05, "loss": 0.4903, "step": 2895 }, { "epoch": 0.33, "learning_rate": 1.5614617215142412e-05, "loss": 0.4736, "step": 2896 }, { "epoch": 0.33, "learning_rate": 1.5611553702900275e-05, "loss": 0.4637, "step": 2897 }, { "epoch": 0.33, "learning_rate": 1.5608489421749995e-05, "loss": 0.4758, "step": 2898 }, { "epoch": 0.33, "learning_rate": 1.5605424372111447e-05, "loss": 0.4812, "step": 2899 }, { "epoch": 0.33, "learning_rate": 1.5602358554404613e-05, "loss": 0.4662, "step": 2900 }, { "epoch": 0.33, "learning_rate": 1.5599291969049575e-05, "loss": 0.4708, "step": 2901 }, { "epoch": 0.33, "learning_rate": 1.5596224616466527e-05, "loss": 0.469, "step": 2902 }, { "epoch": 0.33, "learning_rate": 1.5593156497075767e-05, "loss": 0.4772, "step": 2903 }, { "epoch": 0.33, "learning_rate": 1.5590087611297694e-05, "loss": 0.484, "step": 2904 }, { "epoch": 0.33, "learning_rate": 1.558701795955281e-05, "loss": 0.468, "step": 2905 }, { "epoch": 0.33, "learning_rate": 1.558394754226173e-05, "loss": 0.4638, "step": 2906 }, { "epoch": 0.33, "learning_rate": 1.5580876359845166e-05, "loss": 0.4748, "step": 2907 }, { "epoch": 0.33, "learning_rate": 1.557780441272395e-05, "loss": 0.4646, "step": 2908 }, { "epoch": 0.33, "learning_rate": 1.5574731701318987e-05, "loss": 0.4657, "step": 2909 }, { "epoch": 0.33, "learning_rate": 1.5571658226051325e-05, "loss": 0.5036, "step": 2910 }, { "epoch": 0.33, "learning_rate": 1.556858398734209e-05, "loss": 0.478, "step": 2911 }, { "epoch": 0.33, "learning_rate": 1.5565508985612525e-05, "loss": 0.4641, "step": 2912 }, { "epoch": 0.33, "learning_rate": 1.556243322128397e-05, "loss": 0.4988, "step": 2913 }, { "epoch": 0.33, "learning_rate": 1.5559356694777882e-05, "loss": 0.4682, "step": 2914 }, { "epoch": 0.33, "learning_rate": 1.5556279406515802e-05, "loss": 0.4605, "step": 2915 }, { "epoch": 0.33, "learning_rate": 1.5553201356919394e-05, "loss": 0.4572, "step": 2916 }, { "epoch": 0.33, "learning_rate": 1.555012254641042e-05, "loss": 0.4649, "step": 2917 }, { "epoch": 0.33, "learning_rate": 1.554704297541074e-05, "loss": 0.4938, "step": 2918 }, { "epoch": 0.33, "learning_rate": 1.5543962644342335e-05, "loss": 0.4751, "step": 2919 }, { "epoch": 0.33, "learning_rate": 1.5540881553627264e-05, "loss": 0.4628, "step": 2920 }, { "epoch": 0.33, "learning_rate": 1.553779970368772e-05, "loss": 0.4738, "step": 2921 }, { "epoch": 0.33, "learning_rate": 1.553471709494598e-05, "loss": 0.4807, "step": 2922 }, { "epoch": 0.33, "learning_rate": 1.5531633727824423e-05, "loss": 0.456, "step": 2923 }, { "epoch": 0.33, "learning_rate": 1.5528549602745545e-05, "loss": 0.4865, "step": 2924 }, { "epoch": 0.33, "learning_rate": 1.5525464720131945e-05, "loss": 0.4608, "step": 2925 }, { "epoch": 0.33, "learning_rate": 1.5522379080406315e-05, "loss": 0.4985, "step": 2926 }, { "epoch": 0.33, "learning_rate": 1.5519292683991455e-05, "loss": 0.4733, "step": 2927 }, { "epoch": 0.33, "learning_rate": 1.5516205531310272e-05, "loss": 0.4852, "step": 2928 }, { "epoch": 0.33, "learning_rate": 1.5513117622785778e-05, "loss": 0.4641, "step": 2929 }, { "epoch": 0.33, "learning_rate": 1.5510028958841085e-05, "loss": 0.4682, "step": 2930 }, { "epoch": 0.33, "learning_rate": 1.5506939539899403e-05, "loss": 0.4544, "step": 2931 }, { "epoch": 0.34, "learning_rate": 1.5503849366384053e-05, "loss": 0.4609, "step": 2932 }, { "epoch": 0.34, "learning_rate": 1.5500758438718463e-05, "loss": 0.4947, "step": 2933 }, { "epoch": 0.34, "learning_rate": 1.5497666757326157e-05, "loss": 0.4783, "step": 2934 }, { "epoch": 0.34, "learning_rate": 1.5494574322630765e-05, "loss": 0.4702, "step": 2935 }, { "epoch": 0.34, "learning_rate": 1.5491481135056012e-05, "loss": 0.5003, "step": 2936 }, { "epoch": 0.34, "learning_rate": 1.5488387195025745e-05, "loss": 0.4549, "step": 2937 }, { "epoch": 0.34, "learning_rate": 1.5485292502963892e-05, "loss": 0.4735, "step": 2938 }, { "epoch": 0.34, "learning_rate": 1.548219705929451e-05, "loss": 0.4817, "step": 2939 }, { "epoch": 0.34, "learning_rate": 1.5479100864441726e-05, "loss": 0.4679, "step": 2940 }, { "epoch": 0.34, "learning_rate": 1.54760039188298e-05, "loss": 0.4699, "step": 2941 }, { "epoch": 0.34, "learning_rate": 1.5472906222883075e-05, "loss": 0.4791, "step": 2942 }, { "epoch": 0.34, "learning_rate": 1.5469807777026014e-05, "loss": 0.4749, "step": 2943 }, { "epoch": 0.34, "learning_rate": 1.5466708581683164e-05, "loss": 0.4845, "step": 2944 }, { "epoch": 0.34, "learning_rate": 1.546360863727919e-05, "loss": 0.4682, "step": 2945 }, { "epoch": 0.34, "learning_rate": 1.546050794423885e-05, "loss": 0.4739, "step": 2946 }, { "epoch": 0.34, "learning_rate": 1.5457406502987007e-05, "loss": 0.4703, "step": 2947 }, { "epoch": 0.34, "learning_rate": 1.5454304313948635e-05, "loss": 0.486, "step": 2948 }, { "epoch": 0.34, "learning_rate": 1.5451201377548793e-05, "loss": 0.4633, "step": 2949 }, { "epoch": 0.34, "learning_rate": 1.5448097694212663e-05, "loss": 0.4788, "step": 2950 }, { "epoch": 0.34, "learning_rate": 1.544499326436551e-05, "loss": 0.4686, "step": 2951 }, { "epoch": 0.34, "learning_rate": 1.5441888088432716e-05, "loss": 0.482, "step": 2952 }, { "epoch": 0.34, "learning_rate": 1.5438782166839757e-05, "loss": 0.4666, "step": 2953 }, { "epoch": 0.34, "learning_rate": 1.5435675500012212e-05, "loss": 0.4929, "step": 2954 }, { "epoch": 0.34, "learning_rate": 1.5432568088375766e-05, "loss": 0.4673, "step": 2955 }, { "epoch": 0.34, "learning_rate": 1.542945993235621e-05, "loss": 0.4798, "step": 2956 }, { "epoch": 0.34, "learning_rate": 1.5426351032379418e-05, "loss": 0.4764, "step": 2957 }, { "epoch": 0.34, "learning_rate": 1.5423241388871383e-05, "loss": 0.4605, "step": 2958 }, { "epoch": 0.34, "learning_rate": 1.54201310022582e-05, "loss": 0.4917, "step": 2959 }, { "epoch": 0.34, "learning_rate": 1.541701987296606e-05, "loss": 0.468, "step": 2960 }, { "epoch": 0.34, "learning_rate": 1.5413908001421257e-05, "loss": 0.4596, "step": 2961 }, { "epoch": 0.34, "learning_rate": 1.5410795388050182e-05, "loss": 0.488, "step": 2962 }, { "epoch": 0.34, "learning_rate": 1.540768203327934e-05, "loss": 0.4573, "step": 2963 }, { "epoch": 0.34, "learning_rate": 1.5404567937535326e-05, "loss": 0.4672, "step": 2964 }, { "epoch": 0.34, "learning_rate": 1.540145310124484e-05, "loss": 0.4718, "step": 2965 }, { "epoch": 0.34, "learning_rate": 1.5398337524834688e-05, "loss": 0.4789, "step": 2966 }, { "epoch": 0.34, "learning_rate": 1.5395221208731766e-05, "loss": 0.4671, "step": 2967 }, { "epoch": 0.34, "learning_rate": 1.5392104153363086e-05, "loss": 0.4992, "step": 2968 }, { "epoch": 0.34, "learning_rate": 1.538898635915576e-05, "loss": 0.4666, "step": 2969 }, { "epoch": 0.34, "learning_rate": 1.5385867826536977e-05, "loss": 0.486, "step": 2970 }, { "epoch": 0.34, "learning_rate": 1.5382748555934058e-05, "loss": 0.4593, "step": 2971 }, { "epoch": 0.34, "learning_rate": 1.5379628547774412e-05, "loss": 0.4736, "step": 2972 }, { "epoch": 0.34, "learning_rate": 1.5376507802485547e-05, "loss": 0.4685, "step": 2973 }, { "epoch": 0.34, "learning_rate": 1.537338632049508e-05, "loss": 0.4572, "step": 2974 }, { "epoch": 0.34, "learning_rate": 1.5370264102230716e-05, "loss": 0.4599, "step": 2975 }, { "epoch": 0.34, "learning_rate": 1.5367141148120275e-05, "loss": 0.4735, "step": 2976 }, { "epoch": 0.34, "learning_rate": 1.5364017458591668e-05, "loss": 0.476, "step": 2977 }, { "epoch": 0.34, "learning_rate": 1.536089303407291e-05, "loss": 0.4663, "step": 2978 }, { "epoch": 0.34, "learning_rate": 1.535776787499212e-05, "loss": 0.4701, "step": 2979 }, { "epoch": 0.34, "learning_rate": 1.5354641981777514e-05, "loss": 0.483, "step": 2980 }, { "epoch": 0.34, "learning_rate": 1.5351515354857404e-05, "loss": 0.4585, "step": 2981 }, { "epoch": 0.34, "learning_rate": 1.5348387994660214e-05, "loss": 0.4679, "step": 2982 }, { "epoch": 0.34, "learning_rate": 1.534525990161446e-05, "loss": 0.4726, "step": 2983 }, { "epoch": 0.34, "learning_rate": 1.534213107614876e-05, "loss": 0.4763, "step": 2984 }, { "epoch": 0.34, "learning_rate": 1.5339001518691833e-05, "loss": 0.4865, "step": 2985 }, { "epoch": 0.34, "learning_rate": 1.5335871229672496e-05, "loss": 0.4598, "step": 2986 }, { "epoch": 0.34, "learning_rate": 1.5332740209519674e-05, "loss": 0.4754, "step": 2987 }, { "epoch": 0.34, "learning_rate": 1.5329608458662383e-05, "loss": 0.4915, "step": 2988 }, { "epoch": 0.34, "learning_rate": 1.5326475977529745e-05, "loss": 0.4633, "step": 2989 }, { "epoch": 0.34, "learning_rate": 1.5323342766550978e-05, "loss": 0.4808, "step": 2990 }, { "epoch": 0.34, "learning_rate": 1.53202088261554e-05, "loss": 0.4753, "step": 2991 }, { "epoch": 0.34, "learning_rate": 1.5317074156772434e-05, "loss": 0.4628, "step": 2992 }, { "epoch": 0.34, "learning_rate": 1.5313938758831596e-05, "loss": 0.4698, "step": 2993 }, { "epoch": 0.34, "learning_rate": 1.531080263276251e-05, "loss": 0.4773, "step": 2994 }, { "epoch": 0.34, "learning_rate": 1.5307665778994897e-05, "loss": 0.4576, "step": 2995 }, { "epoch": 0.34, "learning_rate": 1.5304528197958565e-05, "loss": 0.4724, "step": 2996 }, { "epoch": 0.34, "learning_rate": 1.5301389890083446e-05, "loss": 0.4608, "step": 2997 }, { "epoch": 0.34, "learning_rate": 1.529825085579955e-05, "loss": 0.4734, "step": 2998 }, { "epoch": 0.34, "learning_rate": 1.5295111095536997e-05, "loss": 0.4648, "step": 2999 }, { "epoch": 0.34, "learning_rate": 1.5291970609726008e-05, "loss": 0.454, "step": 3000 }, { "epoch": 0.34, "learning_rate": 1.5288829398796892e-05, "loss": 0.4805, "step": 3001 }, { "epoch": 0.34, "learning_rate": 1.528568746318007e-05, "loss": 0.4806, "step": 3002 }, { "epoch": 0.34, "learning_rate": 1.5282544803306056e-05, "loss": 0.4626, "step": 3003 }, { "epoch": 0.34, "learning_rate": 1.5279401419605466e-05, "loss": 0.4611, "step": 3004 }, { "epoch": 0.34, "learning_rate": 1.527625731250901e-05, "loss": 0.4811, "step": 3005 }, { "epoch": 0.34, "learning_rate": 1.527311248244751e-05, "loss": 0.4894, "step": 3006 }, { "epoch": 0.34, "learning_rate": 1.5269966929851866e-05, "loss": 0.4652, "step": 3007 }, { "epoch": 0.34, "learning_rate": 1.52668206551531e-05, "loss": 0.4701, "step": 3008 }, { "epoch": 0.34, "learning_rate": 1.526367365878231e-05, "loss": 0.4649, "step": 3009 }, { "epoch": 0.34, "learning_rate": 1.526052594117071e-05, "loss": 0.4541, "step": 3010 }, { "epoch": 0.34, "learning_rate": 1.5257377502749614e-05, "loss": 0.4898, "step": 3011 }, { "epoch": 0.34, "learning_rate": 1.525422834395042e-05, "loss": 0.4587, "step": 3012 }, { "epoch": 0.34, "learning_rate": 1.525107846520464e-05, "loss": 0.4891, "step": 3013 }, { "epoch": 0.34, "learning_rate": 1.5247927866943869e-05, "loss": 0.4719, "step": 3014 }, { "epoch": 0.34, "learning_rate": 1.5244776549599816e-05, "loss": 0.4638, "step": 3015 }, { "epoch": 0.34, "learning_rate": 1.5241624513604281e-05, "loss": 0.4802, "step": 3016 }, { "epoch": 0.34, "learning_rate": 1.523847175938916e-05, "loss": 0.4526, "step": 3017 }, { "epoch": 0.34, "learning_rate": 1.5235318287386455e-05, "loss": 0.4785, "step": 3018 }, { "epoch": 0.35, "learning_rate": 1.5232164098028257e-05, "loss": 0.4786, "step": 3019 }, { "epoch": 0.35, "learning_rate": 1.5229009191746769e-05, "loss": 0.4906, "step": 3020 }, { "epoch": 0.35, "learning_rate": 1.5225853568974271e-05, "loss": 0.4532, "step": 3021 }, { "epoch": 0.35, "learning_rate": 1.5222697230143166e-05, "loss": 0.4748, "step": 3022 }, { "epoch": 0.35, "learning_rate": 1.5219540175685938e-05, "loss": 0.4803, "step": 3023 }, { "epoch": 0.35, "learning_rate": 1.521638240603517e-05, "loss": 0.4751, "step": 3024 }, { "epoch": 0.35, "learning_rate": 1.5213223921623553e-05, "loss": 0.4679, "step": 3025 }, { "epoch": 0.35, "learning_rate": 1.5210064722883865e-05, "loss": 0.4836, "step": 3026 }, { "epoch": 0.35, "learning_rate": 1.5206904810248992e-05, "loss": 0.4656, "step": 3027 }, { "epoch": 0.35, "learning_rate": 1.5203744184151907e-05, "loss": 0.4757, "step": 3028 }, { "epoch": 0.35, "learning_rate": 1.5200582845025688e-05, "loss": 0.4992, "step": 3029 }, { "epoch": 0.35, "learning_rate": 1.5197420793303514e-05, "loss": 0.4701, "step": 3030 }, { "epoch": 0.35, "learning_rate": 1.5194258029418657e-05, "loss": 0.4565, "step": 3031 }, { "epoch": 0.35, "learning_rate": 1.5191094553804476e-05, "loss": 0.4628, "step": 3032 }, { "epoch": 0.35, "learning_rate": 1.5187930366894442e-05, "loss": 0.4777, "step": 3033 }, { "epoch": 0.35, "learning_rate": 1.5184765469122122e-05, "loss": 0.4835, "step": 3034 }, { "epoch": 0.35, "learning_rate": 1.5181599860921182e-05, "loss": 0.4564, "step": 3035 }, { "epoch": 0.35, "learning_rate": 1.517843354272537e-05, "loss": 0.4759, "step": 3036 }, { "epoch": 0.35, "learning_rate": 1.517526651496855e-05, "loss": 0.4583, "step": 3037 }, { "epoch": 0.35, "learning_rate": 1.5172098778084672e-05, "loss": 0.4962, "step": 3038 }, { "epoch": 0.35, "learning_rate": 1.5168930332507791e-05, "loss": 0.4479, "step": 3039 }, { "epoch": 0.35, "learning_rate": 1.5165761178672052e-05, "loss": 0.4767, "step": 3040 }, { "epoch": 0.35, "learning_rate": 1.51625913170117e-05, "loss": 0.4743, "step": 3041 }, { "epoch": 0.35, "learning_rate": 1.5159420747961076e-05, "loss": 0.4861, "step": 3042 }, { "epoch": 0.35, "learning_rate": 1.5156249471954617e-05, "loss": 0.46, "step": 3043 }, { "epoch": 0.35, "learning_rate": 1.5153077489426865e-05, "loss": 0.468, "step": 3044 }, { "epoch": 0.35, "learning_rate": 1.5149904800812448e-05, "loss": 0.4918, "step": 3045 }, { "epoch": 0.35, "learning_rate": 1.514673140654609e-05, "loss": 0.4897, "step": 3046 }, { "epoch": 0.35, "learning_rate": 1.514355730706263e-05, "loss": 0.4717, "step": 3047 }, { "epoch": 0.35, "learning_rate": 1.5140382502796978e-05, "loss": 0.4652, "step": 3048 }, { "epoch": 0.35, "learning_rate": 1.5137206994184159e-05, "loss": 0.4705, "step": 3049 }, { "epoch": 0.35, "learning_rate": 1.5134030781659288e-05, "loss": 0.4599, "step": 3050 }, { "epoch": 0.35, "learning_rate": 1.513085386565758e-05, "loss": 0.4557, "step": 3051 }, { "epoch": 0.35, "learning_rate": 1.5127676246614336e-05, "loss": 0.4788, "step": 3052 }, { "epoch": 0.35, "learning_rate": 1.5124497924964966e-05, "loss": 0.4772, "step": 3053 }, { "epoch": 0.35, "learning_rate": 1.512131890114497e-05, "loss": 0.473, "step": 3054 }, { "epoch": 0.35, "learning_rate": 1.5118139175589944e-05, "loss": 0.4603, "step": 3055 }, { "epoch": 0.35, "learning_rate": 1.5114958748735584e-05, "loss": 0.4807, "step": 3056 }, { "epoch": 0.35, "learning_rate": 1.5111777621017677e-05, "loss": 0.4671, "step": 3057 }, { "epoch": 0.35, "learning_rate": 1.5108595792872112e-05, "loss": 0.4546, "step": 3058 }, { "epoch": 0.35, "learning_rate": 1.5105413264734866e-05, "loss": 0.4701, "step": 3059 }, { "epoch": 0.35, "learning_rate": 1.5102230037042018e-05, "loss": 0.4811, "step": 3060 }, { "epoch": 0.35, "learning_rate": 1.5099046110229742e-05, "loss": 0.4597, "step": 3061 }, { "epoch": 0.35, "learning_rate": 1.5095861484734307e-05, "loss": 0.4749, "step": 3062 }, { "epoch": 0.35, "learning_rate": 1.5092676160992077e-05, "loss": 0.4709, "step": 3063 }, { "epoch": 0.35, "learning_rate": 1.5089490139439514e-05, "loss": 0.4601, "step": 3064 }, { "epoch": 0.35, "learning_rate": 1.508630342051317e-05, "loss": 0.4482, "step": 3065 }, { "epoch": 0.35, "learning_rate": 1.5083116004649703e-05, "loss": 0.4873, "step": 3066 }, { "epoch": 0.35, "learning_rate": 1.5079927892285855e-05, "loss": 0.4526, "step": 3067 }, { "epoch": 0.35, "learning_rate": 1.5076739083858472e-05, "loss": 0.4646, "step": 3068 }, { "epoch": 0.35, "learning_rate": 1.5073549579804493e-05, "loss": 0.4813, "step": 3069 }, { "epoch": 0.35, "learning_rate": 1.5070359380560944e-05, "loss": 0.4693, "step": 3070 }, { "epoch": 0.35, "learning_rate": 1.5067168486564959e-05, "loss": 0.4967, "step": 3071 }, { "epoch": 0.35, "learning_rate": 1.5063976898253763e-05, "loss": 0.4671, "step": 3072 }, { "epoch": 0.35, "learning_rate": 1.506078461606467e-05, "loss": 0.4815, "step": 3073 }, { "epoch": 0.35, "learning_rate": 1.5057591640435098e-05, "loss": 0.471, "step": 3074 }, { "epoch": 0.35, "learning_rate": 1.5054397971802557e-05, "loss": 0.4657, "step": 3075 }, { "epoch": 0.35, "learning_rate": 1.5051203610604643e-05, "loss": 0.4786, "step": 3076 }, { "epoch": 0.35, "learning_rate": 1.5048008557279064e-05, "loss": 0.4743, "step": 3077 }, { "epoch": 0.35, "learning_rate": 1.504481281226361e-05, "loss": 0.4958, "step": 3078 }, { "epoch": 0.35, "learning_rate": 1.504161637599617e-05, "loss": 0.4849, "step": 3079 }, { "epoch": 0.35, "learning_rate": 1.5038419248914725e-05, "loss": 0.4544, "step": 3080 }, { "epoch": 0.35, "learning_rate": 1.5035221431457352e-05, "loss": 0.478, "step": 3081 }, { "epoch": 0.35, "learning_rate": 1.5032022924062228e-05, "loss": 0.4758, "step": 3082 }, { "epoch": 0.35, "learning_rate": 1.5028823727167621e-05, "loss": 0.4713, "step": 3083 }, { "epoch": 0.35, "learning_rate": 1.5025623841211885e-05, "loss": 0.4591, "step": 3084 }, { "epoch": 0.35, "learning_rate": 1.502242326663348e-05, "loss": 0.457, "step": 3085 }, { "epoch": 0.35, "learning_rate": 1.5019222003870954e-05, "loss": 0.4923, "step": 3086 }, { "epoch": 0.35, "learning_rate": 1.501602005336296e-05, "loss": 0.4548, "step": 3087 }, { "epoch": 0.35, "learning_rate": 1.5012817415548226e-05, "loss": 0.4693, "step": 3088 }, { "epoch": 0.35, "learning_rate": 1.500961409086559e-05, "loss": 0.4745, "step": 3089 }, { "epoch": 0.35, "learning_rate": 1.5006410079753974e-05, "loss": 0.4642, "step": 3090 }, { "epoch": 0.35, "learning_rate": 1.5003205382652409e-05, "loss": 0.4622, "step": 3091 }, { "epoch": 0.35, "learning_rate": 1.5000000000000002e-05, "loss": 0.4943, "step": 3092 }, { "epoch": 0.35, "learning_rate": 1.4996793932235965e-05, "loss": 0.4657, "step": 3093 }, { "epoch": 0.35, "learning_rate": 1.4993587179799598e-05, "loss": 0.4849, "step": 3094 }, { "epoch": 0.35, "learning_rate": 1.49903797431303e-05, "loss": 0.4615, "step": 3095 }, { "epoch": 0.35, "learning_rate": 1.4987171622667562e-05, "loss": 0.4694, "step": 3096 }, { "epoch": 0.35, "learning_rate": 1.4983962818850967e-05, "loss": 0.4771, "step": 3097 }, { "epoch": 0.35, "learning_rate": 1.4980753332120193e-05, "loss": 0.4754, "step": 3098 }, { "epoch": 0.35, "learning_rate": 1.4977543162915011e-05, "loss": 0.4576, "step": 3099 }, { "epoch": 0.35, "learning_rate": 1.4974332311675286e-05, "loss": 0.4701, "step": 3100 }, { "epoch": 0.35, "learning_rate": 1.497112077884098e-05, "loss": 0.4787, "step": 3101 }, { "epoch": 0.35, "learning_rate": 1.4967908564852137e-05, "loss": 0.5031, "step": 3102 }, { "epoch": 0.35, "learning_rate": 1.4964695670148907e-05, "loss": 0.47, "step": 3103 }, { "epoch": 0.35, "learning_rate": 1.4961482095171529e-05, "loss": 0.4716, "step": 3104 }, { "epoch": 0.35, "learning_rate": 1.4958267840360332e-05, "loss": 0.4739, "step": 3105 }, { "epoch": 0.35, "learning_rate": 1.495505290615574e-05, "loss": 0.4693, "step": 3106 }, { "epoch": 0.36, "learning_rate": 1.4951837292998277e-05, "loss": 0.4659, "step": 3107 }, { "epoch": 0.36, "learning_rate": 1.4948621001328544e-05, "loss": 0.4686, "step": 3108 }, { "epoch": 0.36, "learning_rate": 1.4945404031587255e-05, "loss": 0.4645, "step": 3109 }, { "epoch": 0.36, "learning_rate": 1.4942186384215198e-05, "loss": 0.4806, "step": 3110 }, { "epoch": 0.36, "learning_rate": 1.4938968059653269e-05, "loss": 0.4747, "step": 3111 }, { "epoch": 0.36, "learning_rate": 1.4935749058342446e-05, "loss": 0.4749, "step": 3112 }, { "epoch": 0.36, "learning_rate": 1.4932529380723806e-05, "loss": 0.4757, "step": 3113 }, { "epoch": 0.36, "learning_rate": 1.4929309027238517e-05, "loss": 0.4718, "step": 3114 }, { "epoch": 0.36, "learning_rate": 1.4926087998327838e-05, "loss": 0.4873, "step": 3115 }, { "epoch": 0.36, "learning_rate": 1.4922866294433122e-05, "loss": 0.458, "step": 3116 }, { "epoch": 0.36, "learning_rate": 1.4919643915995816e-05, "loss": 0.4518, "step": 3117 }, { "epoch": 0.36, "learning_rate": 1.4916420863457456e-05, "loss": 0.484, "step": 3118 }, { "epoch": 0.36, "learning_rate": 1.4913197137259675e-05, "loss": 0.4704, "step": 3119 }, { "epoch": 0.36, "learning_rate": 1.490997273784419e-05, "loss": 0.4703, "step": 3120 }, { "epoch": 0.36, "learning_rate": 1.4906747665652821e-05, "loss": 0.472, "step": 3121 }, { "epoch": 0.36, "learning_rate": 1.4903521921127472e-05, "loss": 0.4628, "step": 3122 }, { "epoch": 0.36, "learning_rate": 1.4900295504710143e-05, "loss": 0.4817, "step": 3123 }, { "epoch": 0.36, "learning_rate": 1.4897068416842926e-05, "loss": 0.464, "step": 3124 }, { "epoch": 0.36, "learning_rate": 1.4893840657968001e-05, "loss": 0.4822, "step": 3125 }, { "epoch": 0.36, "learning_rate": 1.4890612228527648e-05, "loss": 0.4618, "step": 3126 }, { "epoch": 0.36, "learning_rate": 1.4887383128964232e-05, "loss": 0.4776, "step": 3127 }, { "epoch": 0.36, "learning_rate": 1.4884153359720205e-05, "loss": 0.4775, "step": 3128 }, { "epoch": 0.36, "learning_rate": 1.4880922921238128e-05, "loss": 0.4653, "step": 3129 }, { "epoch": 0.36, "learning_rate": 1.4877691813960638e-05, "loss": 0.4933, "step": 3130 }, { "epoch": 0.36, "learning_rate": 1.4874460038330469e-05, "loss": 0.465, "step": 3131 }, { "epoch": 0.36, "learning_rate": 1.4871227594790447e-05, "loss": 0.4592, "step": 3132 }, { "epoch": 0.36, "learning_rate": 1.4867994483783485e-05, "loss": 0.4704, "step": 3133 }, { "epoch": 0.36, "learning_rate": 1.48647607057526e-05, "loss": 0.4597, "step": 3134 }, { "epoch": 0.36, "learning_rate": 1.4861526261140886e-05, "loss": 0.4649, "step": 3135 }, { "epoch": 0.36, "learning_rate": 1.4858291150391533e-05, "loss": 0.4881, "step": 3136 }, { "epoch": 0.36, "learning_rate": 1.4855055373947829e-05, "loss": 0.4686, "step": 3137 }, { "epoch": 0.36, "learning_rate": 1.4851818932253137e-05, "loss": 0.4904, "step": 3138 }, { "epoch": 0.36, "learning_rate": 1.4848581825750935e-05, "loss": 0.4775, "step": 3139 }, { "epoch": 0.36, "learning_rate": 1.4845344054884772e-05, "loss": 0.456, "step": 3140 }, { "epoch": 0.36, "learning_rate": 1.4842105620098292e-05, "loss": 0.4727, "step": 3141 }, { "epoch": 0.36, "learning_rate": 1.4838866521835238e-05, "loss": 0.4698, "step": 3142 }, { "epoch": 0.36, "learning_rate": 1.4835626760539437e-05, "loss": 0.4501, "step": 3143 }, { "epoch": 0.36, "learning_rate": 1.483238633665481e-05, "loss": 0.4737, "step": 3144 }, { "epoch": 0.36, "learning_rate": 1.4829145250625368e-05, "loss": 0.476, "step": 3145 }, { "epoch": 0.36, "learning_rate": 1.4825903502895207e-05, "loss": 0.4562, "step": 3146 }, { "epoch": 0.36, "learning_rate": 1.4822661093908521e-05, "loss": 0.4805, "step": 3147 }, { "epoch": 0.36, "learning_rate": 1.4819418024109595e-05, "loss": 0.4816, "step": 3148 }, { "epoch": 0.36, "learning_rate": 1.4816174293942804e-05, "loss": 0.4696, "step": 3149 }, { "epoch": 0.36, "learning_rate": 1.4812929903852606e-05, "loss": 0.4819, "step": 3150 }, { "epoch": 0.36, "learning_rate": 1.4809684854283557e-05, "loss": 0.4685, "step": 3151 }, { "epoch": 0.36, "learning_rate": 1.4806439145680298e-05, "loss": 0.4632, "step": 3152 }, { "epoch": 0.36, "learning_rate": 1.4803192778487569e-05, "loss": 0.4622, "step": 3153 }, { "epoch": 0.36, "learning_rate": 1.4799945753150194e-05, "loss": 0.508, "step": 3154 }, { "epoch": 0.36, "learning_rate": 1.4796698070113084e-05, "loss": 0.4752, "step": 3155 }, { "epoch": 0.36, "learning_rate": 1.4793449729821248e-05, "loss": 0.4801, "step": 3156 }, { "epoch": 0.36, "learning_rate": 1.4790200732719779e-05, "loss": 0.4513, "step": 3157 }, { "epoch": 0.36, "learning_rate": 1.4786951079253861e-05, "loss": 0.4687, "step": 3158 }, { "epoch": 0.36, "learning_rate": 1.4783700769868775e-05, "loss": 0.5047, "step": 3159 }, { "epoch": 0.36, "learning_rate": 1.4780449805009878e-05, "loss": 0.4439, "step": 3160 }, { "epoch": 0.36, "learning_rate": 1.477719818512263e-05, "loss": 0.481, "step": 3161 }, { "epoch": 0.36, "learning_rate": 1.4773945910652576e-05, "loss": 0.4716, "step": 3162 }, { "epoch": 0.36, "learning_rate": 1.4770692982045344e-05, "loss": 0.4807, "step": 3163 }, { "epoch": 0.36, "learning_rate": 1.4767439399746666e-05, "loss": 0.476, "step": 3164 }, { "epoch": 0.36, "learning_rate": 1.4764185164202349e-05, "loss": 0.4745, "step": 3165 }, { "epoch": 0.36, "learning_rate": 1.47609302758583e-05, "loss": 0.4644, "step": 3166 }, { "epoch": 0.36, "learning_rate": 1.4757674735160512e-05, "loss": 0.4823, "step": 3167 }, { "epoch": 0.36, "learning_rate": 1.475441854255506e-05, "loss": 0.464, "step": 3168 }, { "epoch": 0.36, "learning_rate": 1.4751161698488124e-05, "loss": 0.4667, "step": 3169 }, { "epoch": 0.36, "learning_rate": 1.4747904203405959e-05, "loss": 0.4758, "step": 3170 }, { "epoch": 0.36, "learning_rate": 1.4744646057754913e-05, "loss": 0.4825, "step": 3171 }, { "epoch": 0.36, "learning_rate": 1.4741387261981428e-05, "loss": 0.447, "step": 3172 }, { "epoch": 0.36, "learning_rate": 1.4738127816532034e-05, "loss": 0.4674, "step": 3173 }, { "epoch": 0.36, "learning_rate": 1.4734867721853341e-05, "loss": 0.4779, "step": 3174 }, { "epoch": 0.36, "learning_rate": 1.4731606978392061e-05, "loss": 0.4519, "step": 3175 }, { "epoch": 0.36, "learning_rate": 1.4728345586594986e-05, "loss": 0.4539, "step": 3176 }, { "epoch": 0.36, "learning_rate": 1.4725083546909e-05, "loss": 0.474, "step": 3177 }, { "epoch": 0.36, "learning_rate": 1.4721820859781076e-05, "loss": 0.479, "step": 3178 }, { "epoch": 0.36, "learning_rate": 1.4718557525658272e-05, "loss": 0.477, "step": 3179 }, { "epoch": 0.36, "learning_rate": 1.471529354498774e-05, "loss": 0.4798, "step": 3180 }, { "epoch": 0.36, "learning_rate": 1.471202891821672e-05, "loss": 0.4852, "step": 3181 }, { "epoch": 0.36, "learning_rate": 1.4708763645792531e-05, "loss": 0.4692, "step": 3182 }, { "epoch": 0.36, "learning_rate": 1.4705497728162602e-05, "loss": 0.4714, "step": 3183 }, { "epoch": 0.36, "learning_rate": 1.4702231165774423e-05, "loss": 0.4565, "step": 3184 }, { "epoch": 0.36, "learning_rate": 1.4698963959075592e-05, "loss": 0.494, "step": 3185 }, { "epoch": 0.36, "learning_rate": 1.469569610851379e-05, "loss": 0.458, "step": 3186 }, { "epoch": 0.36, "learning_rate": 1.4692427614536783e-05, "loss": 0.4748, "step": 3187 }, { "epoch": 0.36, "learning_rate": 1.4689158477592433e-05, "loss": 0.4661, "step": 3188 }, { "epoch": 0.36, "learning_rate": 1.4685888698128677e-05, "loss": 0.4881, "step": 3189 }, { "epoch": 0.36, "learning_rate": 1.468261827659355e-05, "loss": 0.4749, "step": 3190 }, { "epoch": 0.36, "learning_rate": 1.4679347213435176e-05, "loss": 0.4825, "step": 3191 }, { "epoch": 0.36, "learning_rate": 1.4676075509101763e-05, "loss": 0.4861, "step": 3192 }, { "epoch": 0.36, "learning_rate": 1.4672803164041604e-05, "loss": 0.4816, "step": 3193 }, { "epoch": 0.37, "learning_rate": 1.4669530178703089e-05, "loss": 0.4642, "step": 3194 }, { "epoch": 0.37, "learning_rate": 1.4666256553534681e-05, "loss": 0.4829, "step": 3195 }, { "epoch": 0.37, "learning_rate": 1.466298228898495e-05, "loss": 0.4793, "step": 3196 }, { "epoch": 0.37, "learning_rate": 1.465970738550254e-05, "loss": 0.4768, "step": 3197 }, { "epoch": 0.37, "learning_rate": 1.4656431843536182e-05, "loss": 0.4439, "step": 3198 }, { "epoch": 0.37, "learning_rate": 1.4653155663534702e-05, "loss": 0.4805, "step": 3199 }, { "epoch": 0.37, "learning_rate": 1.464987884594701e-05, "loss": 0.4833, "step": 3200 }, { "epoch": 0.37, "learning_rate": 1.4646601391222102e-05, "loss": 0.4571, "step": 3201 }, { "epoch": 0.37, "learning_rate": 1.464332329980906e-05, "loss": 0.4729, "step": 3202 }, { "epoch": 0.37, "learning_rate": 1.4640044572157062e-05, "loss": 0.4818, "step": 3203 }, { "epoch": 0.37, "learning_rate": 1.4636765208715358e-05, "loss": 0.4877, "step": 3204 }, { "epoch": 0.37, "learning_rate": 1.4633485209933305e-05, "loss": 0.4683, "step": 3205 }, { "epoch": 0.37, "learning_rate": 1.4630204576260328e-05, "loss": 0.4616, "step": 3206 }, { "epoch": 0.37, "learning_rate": 1.4626923308145948e-05, "loss": 0.4905, "step": 3207 }, { "epoch": 0.37, "learning_rate": 1.4623641406039776e-05, "loss": 0.4609, "step": 3208 }, { "epoch": 0.37, "learning_rate": 1.46203588703915e-05, "loss": 0.4601, "step": 3209 }, { "epoch": 0.37, "learning_rate": 1.4617075701650907e-05, "loss": 0.4575, "step": 3210 }, { "epoch": 0.37, "learning_rate": 1.461379190026786e-05, "loss": 0.4594, "step": 3211 }, { "epoch": 0.37, "learning_rate": 1.4610507466692312e-05, "loss": 0.4681, "step": 3212 }, { "epoch": 0.37, "learning_rate": 1.460722240137431e-05, "loss": 0.48, "step": 3213 }, { "epoch": 0.37, "learning_rate": 1.4603936704763975e-05, "loss": 0.4612, "step": 3214 }, { "epoch": 0.37, "learning_rate": 1.4600650377311523e-05, "loss": 0.4754, "step": 3215 }, { "epoch": 0.37, "learning_rate": 1.4597363419467257e-05, "loss": 0.4533, "step": 3216 }, { "epoch": 0.37, "learning_rate": 1.4594075831681557e-05, "loss": 0.4847, "step": 3217 }, { "epoch": 0.37, "learning_rate": 1.4590787614404902e-05, "loss": 0.4619, "step": 3218 }, { "epoch": 0.37, "learning_rate": 1.4587498768087849e-05, "loss": 0.4724, "step": 3219 }, { "epoch": 0.37, "learning_rate": 1.4584209293181044e-05, "loss": 0.4591, "step": 3220 }, { "epoch": 0.37, "learning_rate": 1.4580919190135219e-05, "loss": 0.4992, "step": 3221 }, { "epoch": 0.37, "learning_rate": 1.4577628459401188e-05, "loss": 0.4668, "step": 3222 }, { "epoch": 0.37, "learning_rate": 1.457433710142986e-05, "loss": 0.4642, "step": 3223 }, { "epoch": 0.37, "learning_rate": 1.4571045116672219e-05, "loss": 0.4759, "step": 3224 }, { "epoch": 0.37, "learning_rate": 1.4567752505579345e-05, "loss": 0.4752, "step": 3225 }, { "epoch": 0.37, "learning_rate": 1.4564459268602396e-05, "loss": 0.4603, "step": 3226 }, { "epoch": 0.37, "learning_rate": 1.4561165406192622e-05, "loss": 0.4835, "step": 3227 }, { "epoch": 0.37, "learning_rate": 1.455787091880135e-05, "loss": 0.466, "step": 3228 }, { "epoch": 0.37, "learning_rate": 1.4554575806880005e-05, "loss": 0.4776, "step": 3229 }, { "epoch": 0.37, "learning_rate": 1.4551280070880089e-05, "loss": 0.4615, "step": 3230 }, { "epoch": 0.37, "learning_rate": 1.454798371125319e-05, "loss": 0.4812, "step": 3231 }, { "epoch": 0.37, "learning_rate": 1.4544686728450982e-05, "loss": 0.4703, "step": 3232 }, { "epoch": 0.37, "learning_rate": 1.4541389122925229e-05, "loss": 0.4607, "step": 3233 }, { "epoch": 0.37, "learning_rate": 1.4538090895127774e-05, "loss": 0.466, "step": 3234 }, { "epoch": 0.37, "learning_rate": 1.4534792045510548e-05, "loss": 0.4682, "step": 3235 }, { "epoch": 0.37, "learning_rate": 1.453149257452557e-05, "loss": 0.4742, "step": 3236 }, { "epoch": 0.37, "learning_rate": 1.4528192482624932e-05, "loss": 0.4683, "step": 3237 }, { "epoch": 0.37, "learning_rate": 1.4524891770260831e-05, "loss": 0.4715, "step": 3238 }, { "epoch": 0.37, "learning_rate": 1.4521590437885533e-05, "loss": 0.4758, "step": 3239 }, { "epoch": 0.37, "learning_rate": 1.4518288485951398e-05, "loss": 0.4706, "step": 3240 }, { "epoch": 0.37, "learning_rate": 1.4514985914910862e-05, "loss": 0.4904, "step": 3241 }, { "epoch": 0.37, "learning_rate": 1.451168272521645e-05, "loss": 0.4547, "step": 3242 }, { "epoch": 0.37, "learning_rate": 1.450837891732078e-05, "loss": 0.4668, "step": 3243 }, { "epoch": 0.37, "learning_rate": 1.4505074491676542e-05, "loss": 0.457, "step": 3244 }, { "epoch": 0.37, "learning_rate": 1.450176944873652e-05, "loss": 0.4586, "step": 3245 }, { "epoch": 0.37, "learning_rate": 1.4498463788953574e-05, "loss": 0.4766, "step": 3246 }, { "epoch": 0.37, "learning_rate": 1.4495157512780655e-05, "loss": 0.4627, "step": 3247 }, { "epoch": 0.37, "learning_rate": 1.4491850620670798e-05, "loss": 0.487, "step": 3248 }, { "epoch": 0.37, "learning_rate": 1.4488543113077121e-05, "loss": 0.4664, "step": 3249 }, { "epoch": 0.37, "learning_rate": 1.4485234990452826e-05, "loss": 0.4712, "step": 3250 }, { "epoch": 0.37, "learning_rate": 1.4481926253251197e-05, "loss": 0.4645, "step": 3251 }, { "epoch": 0.37, "learning_rate": 1.4478616901925606e-05, "loss": 0.4795, "step": 3252 }, { "epoch": 0.37, "learning_rate": 1.4475306936929513e-05, "loss": 0.4754, "step": 3253 }, { "epoch": 0.37, "learning_rate": 1.4471996358716451e-05, "loss": 0.4654, "step": 3254 }, { "epoch": 0.37, "learning_rate": 1.4468685167740044e-05, "loss": 0.4913, "step": 3255 }, { "epoch": 0.37, "learning_rate": 1.4465373364454001e-05, "loss": 0.4487, "step": 3256 }, { "epoch": 0.37, "learning_rate": 1.4462060949312114e-05, "loss": 0.4955, "step": 3257 }, { "epoch": 0.37, "learning_rate": 1.4458747922768256e-05, "loss": 0.4717, "step": 3258 }, { "epoch": 0.37, "learning_rate": 1.4455434285276385e-05, "loss": 0.4566, "step": 3259 }, { "epoch": 0.37, "learning_rate": 1.4452120037290547e-05, "loss": 0.4784, "step": 3260 }, { "epoch": 0.37, "learning_rate": 1.444880517926486e-05, "loss": 0.4602, "step": 3261 }, { "epoch": 0.37, "learning_rate": 1.4445489711653542e-05, "loss": 0.4926, "step": 3262 }, { "epoch": 0.37, "learning_rate": 1.4442173634910881e-05, "loss": 0.4705, "step": 3263 }, { "epoch": 0.37, "learning_rate": 1.4438856949491258e-05, "loss": 0.4573, "step": 3264 }, { "epoch": 0.37, "learning_rate": 1.4435539655849126e-05, "loss": 0.4668, "step": 3265 }, { "epoch": 0.37, "learning_rate": 1.4432221754439037e-05, "loss": 0.4646, "step": 3266 }, { "epoch": 0.37, "learning_rate": 1.4428903245715611e-05, "loss": 0.4654, "step": 3267 }, { "epoch": 0.37, "learning_rate": 1.442558413013356e-05, "loss": 0.4748, "step": 3268 }, { "epoch": 0.37, "learning_rate": 1.4422264408147676e-05, "loss": 0.4817, "step": 3269 }, { "epoch": 0.37, "learning_rate": 1.4418944080212838e-05, "loss": 0.4665, "step": 3270 }, { "epoch": 0.37, "learning_rate": 1.4415623146784e-05, "loss": 0.4809, "step": 3271 }, { "epoch": 0.37, "learning_rate": 1.441230160831621e-05, "loss": 0.4672, "step": 3272 }, { "epoch": 0.37, "learning_rate": 1.4408979465264588e-05, "loss": 0.4713, "step": 3273 }, { "epoch": 0.37, "learning_rate": 1.4405656718084344e-05, "loss": 0.4615, "step": 3274 }, { "epoch": 0.37, "learning_rate": 1.440233336723077e-05, "loss": 0.5039, "step": 3275 }, { "epoch": 0.37, "learning_rate": 1.4399009413159234e-05, "loss": 0.4667, "step": 3276 }, { "epoch": 0.37, "learning_rate": 1.4395684856325198e-05, "loss": 0.4888, "step": 3277 }, { "epoch": 0.37, "learning_rate": 1.4392359697184197e-05, "loss": 0.4571, "step": 3278 }, { "epoch": 0.37, "learning_rate": 1.4389033936191851e-05, "loss": 0.4598, "step": 3279 }, { "epoch": 0.37, "learning_rate": 1.4385707573803869e-05, "loss": 0.4715, "step": 3280 }, { "epoch": 0.37, "learning_rate": 1.4382380610476032e-05, "loss": 0.5006, "step": 3281 }, { "epoch": 0.38, "learning_rate": 1.4379053046664208e-05, "loss": 0.4744, "step": 3282 }, { "epoch": 0.38, "learning_rate": 1.437572488282435e-05, "loss": 0.4742, "step": 3283 }, { "epoch": 0.38, "learning_rate": 1.4372396119412493e-05, "loss": 0.4635, "step": 3284 }, { "epoch": 0.38, "learning_rate": 1.4369066756884745e-05, "loss": 0.4539, "step": 3285 }, { "epoch": 0.38, "learning_rate": 1.4365736795697306e-05, "loss": 0.4807, "step": 3286 }, { "epoch": 0.38, "learning_rate": 1.436240623630646e-05, "loss": 0.486, "step": 3287 }, { "epoch": 0.38, "learning_rate": 1.4359075079168562e-05, "loss": 0.4795, "step": 3288 }, { "epoch": 0.38, "learning_rate": 1.4355743324740055e-05, "loss": 0.4836, "step": 3289 }, { "epoch": 0.38, "learning_rate": 1.4352410973477466e-05, "loss": 0.4509, "step": 3290 }, { "epoch": 0.38, "learning_rate": 1.4349078025837401e-05, "loss": 0.4845, "step": 3291 }, { "epoch": 0.38, "learning_rate": 1.4345744482276551e-05, "loss": 0.4521, "step": 3292 }, { "epoch": 0.38, "learning_rate": 1.4342410343251683e-05, "loss": 0.461, "step": 3293 }, { "epoch": 0.38, "learning_rate": 1.4339075609219645e-05, "loss": 0.4714, "step": 3294 }, { "epoch": 0.38, "learning_rate": 1.4335740280637374e-05, "loss": 0.4697, "step": 3295 }, { "epoch": 0.38, "learning_rate": 1.4332404357961884e-05, "loss": 0.4775, "step": 3296 }, { "epoch": 0.38, "learning_rate": 1.4329067841650274e-05, "loss": 0.4835, "step": 3297 }, { "epoch": 0.38, "learning_rate": 1.4325730732159717e-05, "loss": 0.4689, "step": 3298 }, { "epoch": 0.38, "learning_rate": 1.432239302994747e-05, "loss": 0.4673, "step": 3299 }, { "epoch": 0.38, "learning_rate": 1.4319054735470879e-05, "loss": 0.462, "step": 3300 }, { "epoch": 0.38, "learning_rate": 1.4315715849187362e-05, "loss": 0.4648, "step": 3301 }, { "epoch": 0.38, "learning_rate": 1.4312376371554417e-05, "loss": 0.4644, "step": 3302 }, { "epoch": 0.38, "learning_rate": 1.4309036303029632e-05, "loss": 0.4579, "step": 3303 }, { "epoch": 0.38, "learning_rate": 1.4305695644070665e-05, "loss": 0.4781, "step": 3304 }, { "epoch": 0.38, "learning_rate": 1.4302354395135269e-05, "loss": 0.4719, "step": 3305 }, { "epoch": 0.38, "learning_rate": 1.4299012556681269e-05, "loss": 0.4776, "step": 3306 }, { "epoch": 0.38, "learning_rate": 1.4295670129166564e-05, "loss": 0.4732, "step": 3307 }, { "epoch": 0.38, "learning_rate": 1.4292327113049145e-05, "loss": 0.4742, "step": 3308 }, { "epoch": 0.38, "learning_rate": 1.428898350878708e-05, "loss": 0.4832, "step": 3309 }, { "epoch": 0.38, "learning_rate": 1.428563931683852e-05, "loss": 0.4557, "step": 3310 }, { "epoch": 0.38, "learning_rate": 1.4282294537661692e-05, "loss": 0.4736, "step": 3311 }, { "epoch": 0.38, "learning_rate": 1.4278949171714904e-05, "loss": 0.4591, "step": 3312 }, { "epoch": 0.38, "learning_rate": 1.4275603219456544e-05, "loss": 0.4673, "step": 3313 }, { "epoch": 0.38, "learning_rate": 1.4272256681345087e-05, "loss": 0.4759, "step": 3314 }, { "epoch": 0.38, "learning_rate": 1.4268909557839085e-05, "loss": 0.4635, "step": 3315 }, { "epoch": 0.38, "learning_rate": 1.4265561849397163e-05, "loss": 0.4533, "step": 3316 }, { "epoch": 0.38, "learning_rate": 1.4262213556478033e-05, "loss": 0.4715, "step": 3317 }, { "epoch": 0.38, "learning_rate": 1.4258864679540488e-05, "loss": 0.4616, "step": 3318 }, { "epoch": 0.38, "learning_rate": 1.4255515219043398e-05, "loss": 0.4528, "step": 3319 }, { "epoch": 0.38, "learning_rate": 1.425216517544571e-05, "loss": 0.4803, "step": 3320 }, { "epoch": 0.38, "learning_rate": 1.4248814549206464e-05, "loss": 0.462, "step": 3321 }, { "epoch": 0.38, "learning_rate": 1.4245463340784761e-05, "loss": 0.4962, "step": 3322 }, { "epoch": 0.38, "learning_rate": 1.4242111550639797e-05, "loss": 0.4631, "step": 3323 }, { "epoch": 0.38, "learning_rate": 1.4238759179230841e-05, "loss": 0.4858, "step": 3324 }, { "epoch": 0.38, "learning_rate": 1.4235406227017241e-05, "loss": 0.4673, "step": 3325 }, { "epoch": 0.38, "learning_rate": 1.423205269445843e-05, "loss": 0.4831, "step": 3326 }, { "epoch": 0.38, "learning_rate": 1.4228698582013908e-05, "loss": 0.4592, "step": 3327 }, { "epoch": 0.38, "learning_rate": 1.4225343890143275e-05, "loss": 0.4626, "step": 3328 }, { "epoch": 0.38, "learning_rate": 1.4221988619306192e-05, "loss": 0.4664, "step": 3329 }, { "epoch": 0.38, "learning_rate": 1.4218632769962408e-05, "loss": 0.4782, "step": 3330 }, { "epoch": 0.38, "learning_rate": 1.4215276342571749e-05, "loss": 0.4562, "step": 3331 }, { "epoch": 0.38, "learning_rate": 1.4211919337594118e-05, "loss": 0.4621, "step": 3332 }, { "epoch": 0.38, "learning_rate": 1.4208561755489502e-05, "loss": 0.4751, "step": 3333 }, { "epoch": 0.38, "learning_rate": 1.4205203596717966e-05, "loss": 0.4712, "step": 3334 }, { "epoch": 0.38, "learning_rate": 1.420184486173965e-05, "loss": 0.4627, "step": 3335 }, { "epoch": 0.38, "learning_rate": 1.4198485551014778e-05, "loss": 0.4534, "step": 3336 }, { "epoch": 0.38, "learning_rate": 1.4195125665003648e-05, "loss": 0.4545, "step": 3337 }, { "epoch": 0.38, "learning_rate": 1.4191765204166643e-05, "loss": 0.4793, "step": 3338 }, { "epoch": 0.38, "learning_rate": 1.4188404168964219e-05, "loss": 0.4492, "step": 3339 }, { "epoch": 0.38, "learning_rate": 1.418504255985691e-05, "loss": 0.4563, "step": 3340 }, { "epoch": 0.38, "learning_rate": 1.4181680377305336e-05, "loss": 0.4673, "step": 3341 }, { "epoch": 0.38, "learning_rate": 1.4178317621770187e-05, "loss": 0.4813, "step": 3342 }, { "epoch": 0.38, "learning_rate": 1.4174954293712242e-05, "loss": 0.4651, "step": 3343 }, { "epoch": 0.38, "learning_rate": 1.4171590393592346e-05, "loss": 0.469, "step": 3344 }, { "epoch": 0.38, "learning_rate": 1.4168225921871433e-05, "loss": 0.4549, "step": 3345 }, { "epoch": 0.38, "learning_rate": 1.4164860879010502e-05, "loss": 0.4827, "step": 3346 }, { "epoch": 0.38, "learning_rate": 1.4161495265470649e-05, "loss": 0.4757, "step": 3347 }, { "epoch": 0.38, "learning_rate": 1.4158129081713035e-05, "loss": 0.4788, "step": 3348 }, { "epoch": 0.38, "learning_rate": 1.41547623281989e-05, "loss": 0.4634, "step": 3349 }, { "epoch": 0.38, "learning_rate": 1.415139500538957e-05, "loss": 0.4736, "step": 3350 }, { "epoch": 0.38, "learning_rate": 1.4148027113746435e-05, "loss": 0.4737, "step": 3351 }, { "epoch": 0.38, "learning_rate": 1.4144658653730976e-05, "loss": 0.4693, "step": 3352 }, { "epoch": 0.38, "learning_rate": 1.4141289625804748e-05, "loss": 0.4686, "step": 3353 }, { "epoch": 0.38, "learning_rate": 1.4137920030429386e-05, "loss": 0.4651, "step": 3354 }, { "epoch": 0.38, "learning_rate": 1.4134549868066594e-05, "loss": 0.4646, "step": 3355 }, { "epoch": 0.38, "learning_rate": 1.4131179139178157e-05, "loss": 0.4861, "step": 3356 }, { "epoch": 0.38, "learning_rate": 1.4127807844225947e-05, "loss": 0.4695, "step": 3357 }, { "epoch": 0.38, "learning_rate": 1.4124435983671907e-05, "loss": 0.4706, "step": 3358 }, { "epoch": 0.38, "learning_rate": 1.4121063557978051e-05, "loss": 0.4766, "step": 3359 }, { "epoch": 0.38, "learning_rate": 1.4117690567606483e-05, "loss": 0.4701, "step": 3360 }, { "epoch": 0.38, "learning_rate": 1.411431701301937e-05, "loss": 0.4642, "step": 3361 }, { "epoch": 0.38, "learning_rate": 1.4110942894678971e-05, "loss": 0.4676, "step": 3362 }, { "epoch": 0.38, "learning_rate": 1.410756821304762e-05, "loss": 0.4786, "step": 3363 }, { "epoch": 0.38, "learning_rate": 1.410419296858771e-05, "loss": 0.47, "step": 3364 }, { "epoch": 0.38, "learning_rate": 1.4100817161761738e-05, "loss": 0.4691, "step": 3365 }, { "epoch": 0.38, "learning_rate": 1.4097440793032253e-05, "loss": 0.4569, "step": 3366 }, { "epoch": 0.38, "learning_rate": 1.4094063862861904e-05, "loss": 0.4553, "step": 3367 }, { "epoch": 0.38, "learning_rate": 1.4090686371713403e-05, "loss": 0.4536, "step": 3368 }, { "epoch": 0.39, "learning_rate": 1.4087308320049536e-05, "loss": 0.452, "step": 3369 }, { "epoch": 0.39, "learning_rate": 1.4083929708333173e-05, "loss": 0.4892, "step": 3370 }, { "epoch": 0.39, "learning_rate": 1.4080550537027264e-05, "loss": 0.4583, "step": 3371 }, { "epoch": 0.39, "learning_rate": 1.4077170806594831e-05, "loss": 0.4813, "step": 3372 }, { "epoch": 0.39, "learning_rate": 1.4073790517498967e-05, "loss": 0.4754, "step": 3373 }, { "epoch": 0.39, "learning_rate": 1.4070409670202849e-05, "loss": 0.4719, "step": 3374 }, { "epoch": 0.39, "learning_rate": 1.4067028265169728e-05, "loss": 0.4677, "step": 3375 }, { "epoch": 0.39, "learning_rate": 1.4063646302862938e-05, "loss": 0.4727, "step": 3376 }, { "epoch": 0.39, "learning_rate": 1.406026378374588e-05, "loss": 0.4658, "step": 3377 }, { "epoch": 0.39, "learning_rate": 1.405688070828203e-05, "loss": 0.4719, "step": 3378 }, { "epoch": 0.39, "learning_rate": 1.4053497076934948e-05, "loss": 0.4711, "step": 3379 }, { "epoch": 0.39, "learning_rate": 1.405011289016827e-05, "loss": 0.4865, "step": 3380 }, { "epoch": 0.39, "learning_rate": 1.4046728148445701e-05, "loss": 0.4585, "step": 3381 }, { "epoch": 0.39, "learning_rate": 1.4043342852231027e-05, "loss": 0.4705, "step": 3382 }, { "epoch": 0.39, "learning_rate": 1.4039957001988112e-05, "loss": 0.4612, "step": 3383 }, { "epoch": 0.39, "learning_rate": 1.4036570598180888e-05, "loss": 0.4656, "step": 3384 }, { "epoch": 0.39, "learning_rate": 1.4033183641273374e-05, "loss": 0.4502, "step": 3385 }, { "epoch": 0.39, "learning_rate": 1.4029796131729652e-05, "loss": 0.4727, "step": 3386 }, { "epoch": 0.39, "learning_rate": 1.4026408070013892e-05, "loss": 0.4752, "step": 3387 }, { "epoch": 0.39, "learning_rate": 1.4023019456590335e-05, "loss": 0.4736, "step": 3388 }, { "epoch": 0.39, "learning_rate": 1.4019630291923289e-05, "loss": 0.4678, "step": 3389 }, { "epoch": 0.39, "learning_rate": 1.4016240576477152e-05, "loss": 0.483, "step": 3390 }, { "epoch": 0.39, "learning_rate": 1.401285031071639e-05, "loss": 0.4638, "step": 3391 }, { "epoch": 0.39, "learning_rate": 1.4009459495105542e-05, "loss": 0.4708, "step": 3392 }, { "epoch": 0.39, "learning_rate": 1.400606813010923e-05, "loss": 0.4631, "step": 3393 }, { "epoch": 0.39, "learning_rate": 1.4002676216192141e-05, "loss": 0.4596, "step": 3394 }, { "epoch": 0.39, "learning_rate": 1.3999283753819047e-05, "loss": 0.4453, "step": 3395 }, { "epoch": 0.39, "learning_rate": 1.3995890743454789e-05, "loss": 0.4751, "step": 3396 }, { "epoch": 0.39, "learning_rate": 1.3992497185564289e-05, "loss": 0.4807, "step": 3397 }, { "epoch": 0.39, "learning_rate": 1.3989103080612533e-05, "loss": 0.4586, "step": 3398 }, { "epoch": 0.39, "learning_rate": 1.3985708429064598e-05, "loss": 0.4707, "step": 3399 }, { "epoch": 0.39, "learning_rate": 1.3982313231385622e-05, "loss": 0.4871, "step": 3400 }, { "epoch": 0.39, "learning_rate": 1.3978917488040822e-05, "loss": 0.4575, "step": 3401 }, { "epoch": 0.39, "learning_rate": 1.3975521199495495e-05, "loss": 0.446, "step": 3402 }, { "epoch": 0.39, "learning_rate": 1.3972124366215002e-05, "loss": 0.4673, "step": 3403 }, { "epoch": 0.39, "learning_rate": 1.3968726988664788e-05, "loss": 0.4686, "step": 3404 }, { "epoch": 0.39, "learning_rate": 1.3965329067310372e-05, "loss": 0.4776, "step": 3405 }, { "epoch": 0.39, "learning_rate": 1.3961930602617345e-05, "loss": 0.4751, "step": 3406 }, { "epoch": 0.39, "learning_rate": 1.3958531595051367e-05, "loss": 0.4603, "step": 3407 }, { "epoch": 0.39, "learning_rate": 1.395513204507818e-05, "loss": 0.4653, "step": 3408 }, { "epoch": 0.39, "learning_rate": 1.3951731953163606e-05, "loss": 0.4896, "step": 3409 }, { "epoch": 0.39, "learning_rate": 1.3948331319773525e-05, "loss": 0.4479, "step": 3410 }, { "epoch": 0.39, "learning_rate": 1.3944930145373903e-05, "loss": 0.47, "step": 3411 }, { "epoch": 0.39, "learning_rate": 1.3941528430430773e-05, "loss": 0.4531, "step": 3412 }, { "epoch": 0.39, "learning_rate": 1.393812617541025e-05, "loss": 0.4815, "step": 3413 }, { "epoch": 0.39, "learning_rate": 1.3934723380778517e-05, "loss": 0.4752, "step": 3414 }, { "epoch": 0.39, "learning_rate": 1.3931320047001838e-05, "loss": 0.4631, "step": 3415 }, { "epoch": 0.39, "learning_rate": 1.3927916174546536e-05, "loss": 0.4979, "step": 3416 }, { "epoch": 0.39, "learning_rate": 1.3924511763879025e-05, "loss": 0.4603, "step": 3417 }, { "epoch": 0.39, "learning_rate": 1.3921106815465782e-05, "loss": 0.4488, "step": 3418 }, { "epoch": 0.39, "learning_rate": 1.3917701329773364e-05, "loss": 0.4639, "step": 3419 }, { "epoch": 0.39, "learning_rate": 1.3914295307268396e-05, "loss": 0.49, "step": 3420 }, { "epoch": 0.39, "learning_rate": 1.3910888748417577e-05, "loss": 0.4681, "step": 3421 }, { "epoch": 0.39, "learning_rate": 1.3907481653687687e-05, "loss": 0.4684, "step": 3422 }, { "epoch": 0.39, "learning_rate": 1.3904074023545566e-05, "loss": 0.4867, "step": 3423 }, { "epoch": 0.39, "learning_rate": 1.390066585845815e-05, "loss": 0.4704, "step": 3424 }, { "epoch": 0.39, "learning_rate": 1.389725715889242e-05, "loss": 0.4487, "step": 3425 }, { "epoch": 0.39, "learning_rate": 1.3893847925315447e-05, "loss": 0.4687, "step": 3426 }, { "epoch": 0.39, "learning_rate": 1.3890438158194374e-05, "loss": 0.4856, "step": 3427 }, { "epoch": 0.39, "learning_rate": 1.3887027857996416e-05, "loss": 0.4726, "step": 3428 }, { "epoch": 0.39, "learning_rate": 1.3883617025188858e-05, "loss": 0.4639, "step": 3429 }, { "epoch": 0.39, "learning_rate": 1.3880205660239062e-05, "loss": 0.4716, "step": 3430 }, { "epoch": 0.39, "learning_rate": 1.387679376361446e-05, "loss": 0.4622, "step": 3431 }, { "epoch": 0.39, "learning_rate": 1.3873381335782559e-05, "loss": 0.4813, "step": 3432 }, { "epoch": 0.39, "learning_rate": 1.3869968377210936e-05, "loss": 0.4577, "step": 3433 }, { "epoch": 0.39, "learning_rate": 1.3866554888367243e-05, "loss": 0.4814, "step": 3434 }, { "epoch": 0.39, "learning_rate": 1.3863140869719207e-05, "loss": 0.4519, "step": 3435 }, { "epoch": 0.39, "learning_rate": 1.3859726321734623e-05, "loss": 0.4714, "step": 3436 }, { "epoch": 0.39, "learning_rate": 1.385631124488136e-05, "loss": 0.4725, "step": 3437 }, { "epoch": 0.39, "learning_rate": 1.3852895639627357e-05, "loss": 0.476, "step": 3438 }, { "epoch": 0.39, "learning_rate": 1.3849479506440633e-05, "loss": 0.4709, "step": 3439 }, { "epoch": 0.39, "learning_rate": 1.3846062845789275e-05, "loss": 0.4698, "step": 3440 }, { "epoch": 0.39, "learning_rate": 1.3842645658141436e-05, "loss": 0.4537, "step": 3441 }, { "epoch": 0.39, "learning_rate": 1.383922794396535e-05, "loss": 0.4755, "step": 3442 }, { "epoch": 0.39, "learning_rate": 1.3835809703729322e-05, "loss": 0.4526, "step": 3443 }, { "epoch": 0.39, "learning_rate": 1.3832390937901723e-05, "loss": 0.4573, "step": 3444 }, { "epoch": 0.39, "learning_rate": 1.3828971646951005e-05, "loss": 0.4754, "step": 3445 }, { "epoch": 0.39, "learning_rate": 1.3825551831345685e-05, "loss": 0.4687, "step": 3446 }, { "epoch": 0.39, "learning_rate": 1.3822131491554355e-05, "loss": 0.4574, "step": 3447 }, { "epoch": 0.39, "learning_rate": 1.3818710628045677e-05, "loss": 0.4768, "step": 3448 }, { "epoch": 0.39, "learning_rate": 1.3815289241288383e-05, "loss": 0.473, "step": 3449 }, { "epoch": 0.39, "learning_rate": 1.3811867331751286e-05, "loss": 0.4808, "step": 3450 }, { "epoch": 0.39, "learning_rate": 1.380844489990326e-05, "loss": 0.4514, "step": 3451 }, { "epoch": 0.39, "learning_rate": 1.3805021946213251e-05, "loss": 0.4766, "step": 3452 }, { "epoch": 0.39, "learning_rate": 1.3801598471150286e-05, "loss": 0.4523, "step": 3453 }, { "epoch": 0.39, "learning_rate": 1.3798174475183457e-05, "loss": 0.4715, "step": 3454 }, { "epoch": 0.39, "learning_rate": 1.3794749958781924e-05, "loss": 0.4447, "step": 3455 }, { "epoch": 0.39, "learning_rate": 1.3791324922414924e-05, "loss": 0.471, "step": 3456 }, { "epoch": 0.4, "learning_rate": 1.3787899366551764e-05, "loss": 0.4725, "step": 3457 }, { "epoch": 0.4, "learning_rate": 1.3784473291661824e-05, "loss": 0.4766, "step": 3458 }, { "epoch": 0.4, "learning_rate": 1.3781046698214549e-05, "loss": 0.4553, "step": 3459 }, { "epoch": 0.4, "learning_rate": 1.3777619586679458e-05, "loss": 0.4858, "step": 3460 }, { "epoch": 0.4, "learning_rate": 1.3774191957526144e-05, "loss": 0.4454, "step": 3461 }, { "epoch": 0.4, "learning_rate": 1.3770763811224273e-05, "loss": 0.4684, "step": 3462 }, { "epoch": 0.4, "learning_rate": 1.376733514824357e-05, "loss": 0.4524, "step": 3463 }, { "epoch": 0.4, "learning_rate": 1.3763905969053841e-05, "loss": 0.4756, "step": 3464 }, { "epoch": 0.4, "learning_rate": 1.376047627412496e-05, "loss": 0.4817, "step": 3465 }, { "epoch": 0.4, "learning_rate": 1.3757046063926876e-05, "loss": 0.4717, "step": 3466 }, { "epoch": 0.4, "learning_rate": 1.3753615338929598e-05, "loss": 0.4687, "step": 3467 }, { "epoch": 0.4, "learning_rate": 1.3750184099603216e-05, "loss": 0.4765, "step": 3468 }, { "epoch": 0.4, "learning_rate": 1.3746752346417884e-05, "loss": 0.4669, "step": 3469 }, { "epoch": 0.4, "learning_rate": 1.3743320079843828e-05, "loss": 0.4586, "step": 3470 }, { "epoch": 0.4, "learning_rate": 1.3739887300351349e-05, "loss": 0.4725, "step": 3471 }, { "epoch": 0.4, "learning_rate": 1.3736454008410816e-05, "loss": 0.4761, "step": 3472 }, { "epoch": 0.4, "learning_rate": 1.373302020449266e-05, "loss": 0.4666, "step": 3473 }, { "epoch": 0.4, "learning_rate": 1.3729585889067391e-05, "loss": 0.4902, "step": 3474 }, { "epoch": 0.4, "learning_rate": 1.3726151062605588e-05, "loss": 0.461, "step": 3475 }, { "epoch": 0.4, "learning_rate": 1.3722715725577902e-05, "loss": 0.4729, "step": 3476 }, { "epoch": 0.4, "learning_rate": 1.3719279878455046e-05, "loss": 0.4725, "step": 3477 }, { "epoch": 0.4, "learning_rate": 1.3715843521707805e-05, "loss": 0.4572, "step": 3478 }, { "epoch": 0.4, "learning_rate": 1.3712406655807047e-05, "loss": 0.4482, "step": 3479 }, { "epoch": 0.4, "learning_rate": 1.3708969281223687e-05, "loss": 0.4834, "step": 3480 }, { "epoch": 0.4, "learning_rate": 1.3705531398428736e-05, "loss": 0.4743, "step": 3481 }, { "epoch": 0.4, "learning_rate": 1.3702093007893249e-05, "loss": 0.4896, "step": 3482 }, { "epoch": 0.4, "learning_rate": 1.3698654110088365e-05, "loss": 0.4706, "step": 3483 }, { "epoch": 0.4, "learning_rate": 1.3695214705485294e-05, "loss": 0.4695, "step": 3484 }, { "epoch": 0.4, "learning_rate": 1.3691774794555306e-05, "loss": 0.4616, "step": 3485 }, { "epoch": 0.4, "learning_rate": 1.368833437776975e-05, "loss": 0.4823, "step": 3486 }, { "epoch": 0.4, "learning_rate": 1.3684893455600036e-05, "loss": 0.4539, "step": 3487 }, { "epoch": 0.4, "learning_rate": 1.368145202851765e-05, "loss": 0.4737, "step": 3488 }, { "epoch": 0.4, "learning_rate": 1.3678010096994143e-05, "loss": 0.4613, "step": 3489 }, { "epoch": 0.4, "learning_rate": 1.3674567661501138e-05, "loss": 0.485, "step": 3490 }, { "epoch": 0.4, "learning_rate": 1.3671124722510325e-05, "loss": 0.4766, "step": 3491 }, { "epoch": 0.4, "learning_rate": 1.366768128049346e-05, "loss": 0.4763, "step": 3492 }, { "epoch": 0.4, "learning_rate": 1.3664237335922377e-05, "loss": 0.4588, "step": 3493 }, { "epoch": 0.4, "learning_rate": 1.3660792889268967e-05, "loss": 0.4883, "step": 3494 }, { "epoch": 0.4, "learning_rate": 1.3657347941005204e-05, "loss": 0.4671, "step": 3495 }, { "epoch": 0.4, "learning_rate": 1.3653902491603117e-05, "loss": 0.464, "step": 3496 }, { "epoch": 0.4, "learning_rate": 1.3650456541534811e-05, "loss": 0.4619, "step": 3497 }, { "epoch": 0.4, "learning_rate": 1.3647010091272456e-05, "loss": 0.4806, "step": 3498 }, { "epoch": 0.4, "learning_rate": 1.3643563141288297e-05, "loss": 0.4832, "step": 3499 }, { "epoch": 0.4, "learning_rate": 1.364011569205464e-05, "loss": 0.476, "step": 3500 }, { "epoch": 0.4, "learning_rate": 1.3636667744043864e-05, "loss": 0.4768, "step": 3501 }, { "epoch": 0.4, "learning_rate": 1.3633219297728415e-05, "loss": 0.4722, "step": 3502 }, { "epoch": 0.4, "learning_rate": 1.3629770353580804e-05, "loss": 0.4721, "step": 3503 }, { "epoch": 0.4, "learning_rate": 1.3626320912073616e-05, "loss": 0.4715, "step": 3504 }, { "epoch": 0.4, "learning_rate": 1.3622870973679503e-05, "loss": 0.4711, "step": 3505 }, { "epoch": 0.4, "learning_rate": 1.361942053887118e-05, "loss": 0.4722, "step": 3506 }, { "epoch": 0.4, "learning_rate": 1.3615969608121438e-05, "loss": 0.4726, "step": 3507 }, { "epoch": 0.4, "learning_rate": 1.3612518181903127e-05, "loss": 0.465, "step": 3508 }, { "epoch": 0.4, "learning_rate": 1.360906626068917e-05, "loss": 0.4693, "step": 3509 }, { "epoch": 0.4, "learning_rate": 1.3605613844952561e-05, "loss": 0.4564, "step": 3510 }, { "epoch": 0.4, "learning_rate": 1.3602160935166357e-05, "loss": 0.4639, "step": 3511 }, { "epoch": 0.4, "learning_rate": 1.359870753180368e-05, "loss": 0.4704, "step": 3512 }, { "epoch": 0.4, "learning_rate": 1.3595253635337724e-05, "loss": 0.4511, "step": 3513 }, { "epoch": 0.4, "learning_rate": 1.3591799246241753e-05, "loss": 0.4738, "step": 3514 }, { "epoch": 0.4, "learning_rate": 1.3588344364989096e-05, "loss": 0.478, "step": 3515 }, { "epoch": 0.4, "learning_rate": 1.3584888992053146e-05, "loss": 0.4549, "step": 3516 }, { "epoch": 0.4, "learning_rate": 1.3581433127907366e-05, "loss": 0.4767, "step": 3517 }, { "epoch": 0.4, "learning_rate": 1.357797677302529e-05, "loss": 0.4492, "step": 3518 }, { "epoch": 0.4, "learning_rate": 1.3574519927880511e-05, "loss": 0.4672, "step": 3519 }, { "epoch": 0.4, "learning_rate": 1.3571062592946703e-05, "loss": 0.473, "step": 3520 }, { "epoch": 0.4, "learning_rate": 1.3567604768697585e-05, "loss": 0.4583, "step": 3521 }, { "epoch": 0.4, "learning_rate": 1.3564146455606961e-05, "loss": 0.4575, "step": 3522 }, { "epoch": 0.4, "learning_rate": 1.3560687654148703e-05, "loss": 0.4642, "step": 3523 }, { "epoch": 0.4, "learning_rate": 1.3557228364796742e-05, "loss": 0.4688, "step": 3524 }, { "epoch": 0.4, "learning_rate": 1.3553768588025073e-05, "loss": 0.4582, "step": 3525 }, { "epoch": 0.4, "learning_rate": 1.3550308324307767e-05, "loss": 0.4701, "step": 3526 }, { "epoch": 0.4, "learning_rate": 1.3546847574118951e-05, "loss": 0.4618, "step": 3527 }, { "epoch": 0.4, "learning_rate": 1.3543386337932834e-05, "loss": 0.4574, "step": 3528 }, { "epoch": 0.4, "learning_rate": 1.3539924616223679e-05, "loss": 0.4567, "step": 3529 }, { "epoch": 0.4, "learning_rate": 1.3536462409465816e-05, "loss": 0.4813, "step": 3530 }, { "epoch": 0.4, "learning_rate": 1.3532999718133648e-05, "loss": 0.4813, "step": 3531 }, { "epoch": 0.4, "learning_rate": 1.3529536542701638e-05, "loss": 0.4799, "step": 3532 }, { "epoch": 0.4, "learning_rate": 1.3526072883644326e-05, "loss": 0.4817, "step": 3533 }, { "epoch": 0.4, "learning_rate": 1.3522608741436303e-05, "loss": 0.4664, "step": 3534 }, { "epoch": 0.4, "learning_rate": 1.3519144116552236e-05, "loss": 0.4972, "step": 3535 }, { "epoch": 0.4, "learning_rate": 1.3515679009466856e-05, "loss": 0.4505, "step": 3536 }, { "epoch": 0.4, "learning_rate": 1.3512213420654959e-05, "loss": 0.4666, "step": 3537 }, { "epoch": 0.4, "learning_rate": 1.350874735059141e-05, "loss": 0.4746, "step": 3538 }, { "epoch": 0.4, "learning_rate": 1.3505280799751134e-05, "loss": 0.4741, "step": 3539 }, { "epoch": 0.4, "learning_rate": 1.3501813768609134e-05, "loss": 0.4802, "step": 3540 }, { "epoch": 0.4, "learning_rate": 1.3498346257640461e-05, "loss": 0.4697, "step": 3541 }, { "epoch": 0.4, "learning_rate": 1.349487826732025e-05, "loss": 0.4593, "step": 3542 }, { "epoch": 0.4, "learning_rate": 1.3491409798123687e-05, "loss": 0.4985, "step": 3543 }, { "epoch": 0.41, "learning_rate": 1.3487940850526033e-05, "loss": 0.4663, "step": 3544 }, { "epoch": 0.41, "learning_rate": 1.348447142500261e-05, "loss": 0.4558, "step": 3545 }, { "epoch": 0.41, "learning_rate": 1.3481001522028807e-05, "loss": 0.4566, "step": 3546 }, { "epoch": 0.41, "learning_rate": 1.3477531142080076e-05, "loss": 0.4626, "step": 3547 }, { "epoch": 0.41, "learning_rate": 1.347406028563194e-05, "loss": 0.487, "step": 3548 }, { "epoch": 0.41, "learning_rate": 1.3470588953159982e-05, "loss": 0.4712, "step": 3549 }, { "epoch": 0.41, "learning_rate": 1.3467117145139854e-05, "loss": 0.4427, "step": 3550 }, { "epoch": 0.41, "learning_rate": 1.3463644862047267e-05, "loss": 0.4693, "step": 3551 }, { "epoch": 0.41, "learning_rate": 1.3460172104358007e-05, "loss": 0.4581, "step": 3552 }, { "epoch": 0.41, "learning_rate": 1.3456698872547915e-05, "loss": 0.4775, "step": 3553 }, { "epoch": 0.41, "learning_rate": 1.3453225167092902e-05, "loss": 0.4602, "step": 3554 }, { "epoch": 0.41, "learning_rate": 1.3449750988468943e-05, "loss": 0.4855, "step": 3555 }, { "epoch": 0.41, "learning_rate": 1.344627633715208e-05, "loss": 0.4711, "step": 3556 }, { "epoch": 0.41, "learning_rate": 1.3442801213618417e-05, "loss": 0.4648, "step": 3557 }, { "epoch": 0.41, "learning_rate": 1.3439325618344123e-05, "loss": 0.4784, "step": 3558 }, { "epoch": 0.41, "learning_rate": 1.3435849551805436e-05, "loss": 0.4907, "step": 3559 }, { "epoch": 0.41, "learning_rate": 1.3432373014478644e-05, "loss": 0.4504, "step": 3560 }, { "epoch": 0.41, "learning_rate": 1.3428896006840122e-05, "loss": 0.4856, "step": 3561 }, { "epoch": 0.41, "learning_rate": 1.3425418529366293e-05, "loss": 0.4712, "step": 3562 }, { "epoch": 0.41, "learning_rate": 1.3421940582533645e-05, "loss": 0.4771, "step": 3563 }, { "epoch": 0.41, "learning_rate": 1.3418462166818743e-05, "loss": 0.4686, "step": 3564 }, { "epoch": 0.41, "learning_rate": 1.34149832826982e-05, "loss": 0.4561, "step": 3565 }, { "epoch": 0.41, "learning_rate": 1.3411503930648704e-05, "loss": 0.4762, "step": 3566 }, { "epoch": 0.41, "learning_rate": 1.3408024111147004e-05, "loss": 0.477, "step": 3567 }, { "epoch": 0.41, "learning_rate": 1.3404543824669915e-05, "loss": 0.4383, "step": 3568 }, { "epoch": 0.41, "learning_rate": 1.3401063071694309e-05, "loss": 0.4824, "step": 3569 }, { "epoch": 0.41, "learning_rate": 1.3397581852697128e-05, "loss": 0.4664, "step": 3570 }, { "epoch": 0.41, "learning_rate": 1.3394100168155382e-05, "loss": 0.4723, "step": 3571 }, { "epoch": 0.41, "learning_rate": 1.3390618018546135e-05, "loss": 0.4462, "step": 3572 }, { "epoch": 0.41, "learning_rate": 1.3387135404346519e-05, "loss": 0.4555, "step": 3573 }, { "epoch": 0.41, "learning_rate": 1.338365232603373e-05, "loss": 0.4666, "step": 3574 }, { "epoch": 0.41, "learning_rate": 1.3380168784085028e-05, "loss": 0.4895, "step": 3575 }, { "epoch": 0.41, "learning_rate": 1.3376684778977738e-05, "loss": 0.4813, "step": 3576 }, { "epoch": 0.41, "learning_rate": 1.3373200311189245e-05, "loss": 0.485, "step": 3577 }, { "epoch": 0.41, "learning_rate": 1.3369715381197e-05, "loss": 0.4799, "step": 3578 }, { "epoch": 0.41, "learning_rate": 1.336622998947851e-05, "loss": 0.4667, "step": 3579 }, { "epoch": 0.41, "learning_rate": 1.336274413651136e-05, "loss": 0.4623, "step": 3580 }, { "epoch": 0.41, "learning_rate": 1.3359257822773187e-05, "loss": 0.4914, "step": 3581 }, { "epoch": 0.41, "learning_rate": 1.3355771048741692e-05, "loss": 0.4591, "step": 3582 }, { "epoch": 0.41, "learning_rate": 1.335228381489464e-05, "loss": 0.4642, "step": 3583 }, { "epoch": 0.41, "learning_rate": 1.3348796121709862e-05, "loss": 0.4682, "step": 3584 }, { "epoch": 0.41, "learning_rate": 1.3345307969665252e-05, "loss": 0.4726, "step": 3585 }, { "epoch": 0.41, "learning_rate": 1.3341819359238762e-05, "loss": 0.4532, "step": 3586 }, { "epoch": 0.41, "learning_rate": 1.3338330290908408e-05, "loss": 0.4763, "step": 3587 }, { "epoch": 0.41, "learning_rate": 1.3334840765152272e-05, "loss": 0.4579, "step": 3588 }, { "epoch": 0.41, "learning_rate": 1.3331350782448495e-05, "loss": 0.4719, "step": 3589 }, { "epoch": 0.41, "learning_rate": 1.332786034327529e-05, "loss": 0.4579, "step": 3590 }, { "epoch": 0.41, "learning_rate": 1.3324369448110916e-05, "loss": 0.4598, "step": 3591 }, { "epoch": 0.41, "learning_rate": 1.3320878097433707e-05, "loss": 0.4768, "step": 3592 }, { "epoch": 0.41, "learning_rate": 1.331738629172206e-05, "loss": 0.4901, "step": 3593 }, { "epoch": 0.41, "learning_rate": 1.3313894031454421e-05, "loss": 0.4635, "step": 3594 }, { "epoch": 0.41, "learning_rate": 1.3310401317109316e-05, "loss": 0.4515, "step": 3595 }, { "epoch": 0.41, "learning_rate": 1.330690814916532e-05, "loss": 0.4682, "step": 3596 }, { "epoch": 0.41, "learning_rate": 1.330341452810108e-05, "loss": 0.4734, "step": 3597 }, { "epoch": 0.41, "learning_rate": 1.3299920454395296e-05, "loss": 0.4524, "step": 3598 }, { "epoch": 0.41, "learning_rate": 1.3296425928526735e-05, "loss": 0.4722, "step": 3599 }, { "epoch": 0.41, "learning_rate": 1.3292930950974223e-05, "loss": 0.4714, "step": 3600 }, { "epoch": 0.41, "learning_rate": 1.3289435522216657e-05, "loss": 0.4808, "step": 3601 }, { "epoch": 0.41, "learning_rate": 1.3285939642732979e-05, "loss": 0.4508, "step": 3602 }, { "epoch": 0.41, "learning_rate": 1.3282443313002209e-05, "loss": 0.5019, "step": 3603 }, { "epoch": 0.41, "learning_rate": 1.3278946533503422e-05, "loss": 0.4552, "step": 3604 }, { "epoch": 0.41, "learning_rate": 1.3275449304715753e-05, "loss": 0.4557, "step": 3605 }, { "epoch": 0.41, "learning_rate": 1.3271951627118402e-05, "loss": 0.4747, "step": 3606 }, { "epoch": 0.41, "learning_rate": 1.3268453501190628e-05, "loss": 0.4785, "step": 3607 }, { "epoch": 0.41, "learning_rate": 1.3264954927411751e-05, "loss": 0.4874, "step": 3608 }, { "epoch": 0.41, "learning_rate": 1.3261455906261154e-05, "loss": 0.4692, "step": 3609 }, { "epoch": 0.41, "learning_rate": 1.3257956438218283e-05, "loss": 0.472, "step": 3610 }, { "epoch": 0.41, "learning_rate": 1.3254456523762643e-05, "loss": 0.4603, "step": 3611 }, { "epoch": 0.41, "learning_rate": 1.3250956163373801e-05, "loss": 0.476, "step": 3612 }, { "epoch": 0.41, "learning_rate": 1.324745535753138e-05, "loss": 0.469, "step": 3613 }, { "epoch": 0.41, "learning_rate": 1.3243954106715074e-05, "loss": 0.4551, "step": 3614 }, { "epoch": 0.41, "learning_rate": 1.3240452411404628e-05, "loss": 0.4715, "step": 3615 }, { "epoch": 0.41, "learning_rate": 1.3236950272079858e-05, "loss": 0.4817, "step": 3616 }, { "epoch": 0.41, "learning_rate": 1.3233447689220629e-05, "loss": 0.4714, "step": 3617 }, { "epoch": 0.41, "learning_rate": 1.3229944663306877e-05, "loss": 0.4745, "step": 3618 }, { "epoch": 0.41, "learning_rate": 1.3226441194818596e-05, "loss": 0.4591, "step": 3619 }, { "epoch": 0.41, "learning_rate": 1.3222937284235835e-05, "loss": 0.4703, "step": 3620 }, { "epoch": 0.41, "learning_rate": 1.3219432932038712e-05, "loss": 0.4754, "step": 3621 }, { "epoch": 0.41, "learning_rate": 1.3215928138707396e-05, "loss": 0.4626, "step": 3622 }, { "epoch": 0.41, "learning_rate": 1.321242290472213e-05, "loss": 0.4779, "step": 3623 }, { "epoch": 0.41, "learning_rate": 1.3208917230563201e-05, "loss": 0.4725, "step": 3624 }, { "epoch": 0.41, "learning_rate": 1.3205411116710973e-05, "loss": 0.4656, "step": 3625 }, { "epoch": 0.41, "learning_rate": 1.3201904563645853e-05, "loss": 0.486, "step": 3626 }, { "epoch": 0.41, "learning_rate": 1.3198397571848323e-05, "loss": 0.4626, "step": 3627 }, { "epoch": 0.41, "learning_rate": 1.319489014179892e-05, "loss": 0.4682, "step": 3628 }, { "epoch": 0.41, "learning_rate": 1.3191382273978237e-05, "loss": 0.4631, "step": 3629 }, { "epoch": 0.41, "learning_rate": 1.3187873968866928e-05, "loss": 0.4509, "step": 3630 }, { "epoch": 0.41, "learning_rate": 1.3184365226945715e-05, "loss": 0.4576, "step": 3631 }, { "epoch": 0.42, "learning_rate": 1.318085604869537e-05, "loss": 0.4649, "step": 3632 }, { "epoch": 0.42, "learning_rate": 1.3177346434596734e-05, "loss": 0.4934, "step": 3633 }, { "epoch": 0.42, "learning_rate": 1.3173836385130693e-05, "loss": 0.4483, "step": 3634 }, { "epoch": 0.42, "learning_rate": 1.3170325900778211e-05, "loss": 0.4704, "step": 3635 }, { "epoch": 0.42, "learning_rate": 1.3166814982020298e-05, "loss": 0.4706, "step": 3636 }, { "epoch": 0.42, "learning_rate": 1.3163303629338029e-05, "loss": 0.4671, "step": 3637 }, { "epoch": 0.42, "learning_rate": 1.3159791843212542e-05, "loss": 0.4487, "step": 3638 }, { "epoch": 0.42, "learning_rate": 1.3156279624125023e-05, "loss": 0.4742, "step": 3639 }, { "epoch": 0.42, "learning_rate": 1.3152766972556727e-05, "loss": 0.4657, "step": 3640 }, { "epoch": 0.42, "learning_rate": 1.3149253888988967e-05, "loss": 0.4887, "step": 3641 }, { "epoch": 0.42, "learning_rate": 1.3145740373903118e-05, "loss": 0.4618, "step": 3642 }, { "epoch": 0.42, "learning_rate": 1.31422264277806e-05, "loss": 0.4543, "step": 3643 }, { "epoch": 0.42, "learning_rate": 1.3138712051102908e-05, "loss": 0.4653, "step": 3644 }, { "epoch": 0.42, "learning_rate": 1.3135197244351595e-05, "loss": 0.4668, "step": 3645 }, { "epoch": 0.42, "learning_rate": 1.3131682008008255e-05, "loss": 0.4705, "step": 3646 }, { "epoch": 0.42, "learning_rate": 1.3128166342554567e-05, "loss": 0.4697, "step": 3647 }, { "epoch": 0.42, "learning_rate": 1.3124650248472248e-05, "loss": 0.4545, "step": 3648 }, { "epoch": 0.42, "learning_rate": 1.3121133726243083e-05, "loss": 0.4855, "step": 3649 }, { "epoch": 0.42, "learning_rate": 1.3117616776348915e-05, "loss": 0.4607, "step": 3650 }, { "epoch": 0.42, "learning_rate": 1.3114099399271646e-05, "loss": 0.4721, "step": 3651 }, { "epoch": 0.42, "learning_rate": 1.311058159549323e-05, "loss": 0.4476, "step": 3652 }, { "epoch": 0.42, "learning_rate": 1.3107063365495692e-05, "loss": 0.4616, "step": 3653 }, { "epoch": 0.42, "learning_rate": 1.31035447097611e-05, "loss": 0.454, "step": 3654 }, { "epoch": 0.42, "learning_rate": 1.3100025628771595e-05, "loss": 0.4719, "step": 3655 }, { "epoch": 0.42, "learning_rate": 1.3096506123009368e-05, "loss": 0.4565, "step": 3656 }, { "epoch": 0.42, "learning_rate": 1.3092986192956665e-05, "loss": 0.478, "step": 3657 }, { "epoch": 0.42, "learning_rate": 1.3089465839095803e-05, "loss": 0.4596, "step": 3658 }, { "epoch": 0.42, "learning_rate": 1.3085945061909144e-05, "loss": 0.4778, "step": 3659 }, { "epoch": 0.42, "learning_rate": 1.3082423861879114e-05, "loss": 0.4706, "step": 3660 }, { "epoch": 0.42, "learning_rate": 1.3078902239488196e-05, "loss": 0.4497, "step": 3661 }, { "epoch": 0.42, "learning_rate": 1.3075380195218931e-05, "loss": 0.4668, "step": 3662 }, { "epoch": 0.42, "learning_rate": 1.3071857729553918e-05, "loss": 0.469, "step": 3663 }, { "epoch": 0.42, "learning_rate": 1.3068334842975813e-05, "loss": 0.4776, "step": 3664 }, { "epoch": 0.42, "learning_rate": 1.306481153596733e-05, "loss": 0.4726, "step": 3665 }, { "epoch": 0.42, "learning_rate": 1.3061287809011243e-05, "loss": 0.4661, "step": 3666 }, { "epoch": 0.42, "learning_rate": 1.3057763662590377e-05, "loss": 0.4822, "step": 3667 }, { "epoch": 0.42, "learning_rate": 1.3054239097187625e-05, "loss": 0.4588, "step": 3668 }, { "epoch": 0.42, "learning_rate": 1.3050714113285922e-05, "loss": 0.4591, "step": 3669 }, { "epoch": 0.42, "learning_rate": 1.3047188711368278e-05, "loss": 0.4658, "step": 3670 }, { "epoch": 0.42, "learning_rate": 1.3043662891917748e-05, "loss": 0.4681, "step": 3671 }, { "epoch": 0.42, "learning_rate": 1.3040136655417448e-05, "loss": 0.4674, "step": 3672 }, { "epoch": 0.42, "learning_rate": 1.303661000235055e-05, "loss": 0.4597, "step": 3673 }, { "epoch": 0.42, "learning_rate": 1.3033082933200287e-05, "loss": 0.4537, "step": 3674 }, { "epoch": 0.42, "learning_rate": 1.3029555448449947e-05, "loss": 0.4705, "step": 3675 }, { "epoch": 0.42, "learning_rate": 1.302602754858287e-05, "loss": 0.4701, "step": 3676 }, { "epoch": 0.42, "learning_rate": 1.3022499234082463e-05, "loss": 0.4851, "step": 3677 }, { "epoch": 0.42, "learning_rate": 1.3018970505432176e-05, "loss": 0.4751, "step": 3678 }, { "epoch": 0.42, "learning_rate": 1.3015441363115526e-05, "loss": 0.4522, "step": 3679 }, { "epoch": 0.42, "learning_rate": 1.3011911807616091e-05, "loss": 0.4703, "step": 3680 }, { "epoch": 0.42, "learning_rate": 1.3008381839417493e-05, "loss": 0.4713, "step": 3681 }, { "epoch": 0.42, "learning_rate": 1.3004851459003416e-05, "loss": 0.4806, "step": 3682 }, { "epoch": 0.42, "learning_rate": 1.30013206668576e-05, "loss": 0.4972, "step": 3683 }, { "epoch": 0.42, "learning_rate": 1.2997789463463848e-05, "loss": 0.4535, "step": 3684 }, { "epoch": 0.42, "learning_rate": 1.2994257849306009e-05, "loss": 0.479, "step": 3685 }, { "epoch": 0.42, "learning_rate": 1.2990725824867995e-05, "loss": 0.4595, "step": 3686 }, { "epoch": 0.42, "learning_rate": 1.2987193390633773e-05, "loss": 0.464, "step": 3687 }, { "epoch": 0.42, "learning_rate": 1.298366054708736e-05, "loss": 0.4592, "step": 3688 }, { "epoch": 0.42, "learning_rate": 1.2980127294712839e-05, "loss": 0.4798, "step": 3689 }, { "epoch": 0.42, "learning_rate": 1.2976593633994347e-05, "loss": 0.4443, "step": 3690 }, { "epoch": 0.42, "learning_rate": 1.297305956541607e-05, "loss": 0.4957, "step": 3691 }, { "epoch": 0.42, "learning_rate": 1.2969525089462253e-05, "loss": 0.4539, "step": 3692 }, { "epoch": 0.42, "learning_rate": 1.2965990206617203e-05, "loss": 0.4583, "step": 3693 }, { "epoch": 0.42, "learning_rate": 1.2962454917365275e-05, "loss": 0.4544, "step": 3694 }, { "epoch": 0.42, "learning_rate": 1.2958919222190885e-05, "loss": 0.4833, "step": 3695 }, { "epoch": 0.42, "learning_rate": 1.2955383121578498e-05, "loss": 0.469, "step": 3696 }, { "epoch": 0.42, "learning_rate": 1.2951846616012642e-05, "loss": 0.4562, "step": 3697 }, { "epoch": 0.42, "learning_rate": 1.2948309705977893e-05, "loss": 0.4555, "step": 3698 }, { "epoch": 0.42, "learning_rate": 1.2944772391958896e-05, "loss": 0.4657, "step": 3699 }, { "epoch": 0.42, "learning_rate": 1.294123467444033e-05, "loss": 0.4753, "step": 3700 }, { "epoch": 0.42, "learning_rate": 1.2937696553906949e-05, "loss": 0.4762, "step": 3701 }, { "epoch": 0.42, "learning_rate": 1.2934158030843554e-05, "loss": 0.45, "step": 3702 }, { "epoch": 0.42, "learning_rate": 1.2930619105734999e-05, "loss": 0.4803, "step": 3703 }, { "epoch": 0.42, "learning_rate": 1.2927079779066196e-05, "loss": 0.4837, "step": 3704 }, { "epoch": 0.42, "learning_rate": 1.2923540051322114e-05, "loss": 0.4546, "step": 3705 }, { "epoch": 0.42, "learning_rate": 1.2919999922987775e-05, "loss": 0.4731, "step": 3706 }, { "epoch": 0.42, "learning_rate": 1.291645939454825e-05, "loss": 0.4707, "step": 3707 }, { "epoch": 0.42, "learning_rate": 1.2912918466488678e-05, "loss": 0.4518, "step": 3708 }, { "epoch": 0.42, "learning_rate": 1.2909377139294242e-05, "loss": 0.4774, "step": 3709 }, { "epoch": 0.42, "learning_rate": 1.290583541345018e-05, "loss": 0.4678, "step": 3710 }, { "epoch": 0.42, "learning_rate": 1.2902293289441791e-05, "loss": 0.4693, "step": 3711 }, { "epoch": 0.42, "learning_rate": 1.2898750767754427e-05, "loss": 0.4519, "step": 3712 }, { "epoch": 0.42, "learning_rate": 1.2895207848873488e-05, "loss": 0.4656, "step": 3713 }, { "epoch": 0.42, "learning_rate": 1.2891664533284434e-05, "loss": 0.4719, "step": 3714 }, { "epoch": 0.42, "learning_rate": 1.288812082147278e-05, "loss": 0.4629, "step": 3715 }, { "epoch": 0.42, "learning_rate": 1.2884576713924093e-05, "loss": 0.4535, "step": 3716 }, { "epoch": 0.42, "learning_rate": 1.2881032211123994e-05, "loss": 0.4501, "step": 3717 }, { "epoch": 0.42, "learning_rate": 1.2877487313558159e-05, "loss": 0.4916, "step": 3718 }, { "epoch": 0.43, "learning_rate": 1.287394202171232e-05, "loss": 0.4555, "step": 3719 }, { "epoch": 0.43, "learning_rate": 1.287039633607226e-05, "loss": 0.4693, "step": 3720 }, { "epoch": 0.43, "learning_rate": 1.2866850257123817e-05, "loss": 0.4711, "step": 3721 }, { "epoch": 0.43, "learning_rate": 1.2863303785352883e-05, "loss": 0.4536, "step": 3722 }, { "epoch": 0.43, "learning_rate": 1.2859756921245403e-05, "loss": 0.4687, "step": 3723 }, { "epoch": 0.43, "learning_rate": 1.2856209665287378e-05, "loss": 0.4715, "step": 3724 }, { "epoch": 0.43, "learning_rate": 1.2852662017964863e-05, "loss": 0.4529, "step": 3725 }, { "epoch": 0.43, "learning_rate": 1.2849113979763956e-05, "loss": 0.4851, "step": 3726 }, { "epoch": 0.43, "learning_rate": 1.2845565551170829e-05, "loss": 0.4807, "step": 3727 }, { "epoch": 0.43, "learning_rate": 1.2842016732671689e-05, "loss": 0.456, "step": 3728 }, { "epoch": 0.43, "learning_rate": 1.2838467524752808e-05, "loss": 0.4591, "step": 3729 }, { "epoch": 0.43, "learning_rate": 1.2834917927900504e-05, "loss": 0.4645, "step": 3730 }, { "epoch": 0.43, "learning_rate": 1.2831367942601146e-05, "loss": 0.4533, "step": 3731 }, { "epoch": 0.43, "learning_rate": 1.2827817569341167e-05, "loss": 0.4886, "step": 3732 }, { "epoch": 0.43, "learning_rate": 1.282426680860705e-05, "loss": 0.4656, "step": 3733 }, { "epoch": 0.43, "learning_rate": 1.2820715660885328e-05, "loss": 0.4773, "step": 3734 }, { "epoch": 0.43, "learning_rate": 1.2817164126662581e-05, "loss": 0.4702, "step": 3735 }, { "epoch": 0.43, "learning_rate": 1.281361220642545e-05, "loss": 0.4791, "step": 3736 }, { "epoch": 0.43, "learning_rate": 1.281005990066063e-05, "loss": 0.4713, "step": 3737 }, { "epoch": 0.43, "learning_rate": 1.280650720985487e-05, "loss": 0.4736, "step": 3738 }, { "epoch": 0.43, "learning_rate": 1.2802954134494963e-05, "loss": 0.449, "step": 3739 }, { "epoch": 0.43, "learning_rate": 1.2799400675067754e-05, "loss": 0.4865, "step": 3740 }, { "epoch": 0.43, "learning_rate": 1.2795846832060157e-05, "loss": 0.4372, "step": 3741 }, { "epoch": 0.43, "learning_rate": 1.2792292605959125e-05, "loss": 0.4791, "step": 3742 }, { "epoch": 0.43, "learning_rate": 1.2788737997251665e-05, "loss": 0.4706, "step": 3743 }, { "epoch": 0.43, "learning_rate": 1.2785183006424836e-05, "loss": 0.4556, "step": 3744 }, { "epoch": 0.43, "learning_rate": 1.278162763396575e-05, "loss": 0.4523, "step": 3745 }, { "epoch": 0.43, "learning_rate": 1.2778071880361577e-05, "loss": 0.4699, "step": 3746 }, { "epoch": 0.43, "learning_rate": 1.2774515746099536e-05, "loss": 0.4654, "step": 3747 }, { "epoch": 0.43, "learning_rate": 1.277095923166689e-05, "loss": 0.4471, "step": 3748 }, { "epoch": 0.43, "learning_rate": 1.2767402337550966e-05, "loss": 0.4751, "step": 3749 }, { "epoch": 0.43, "learning_rate": 1.2763845064239134e-05, "loss": 0.4884, "step": 3750 }, { "epoch": 0.43, "learning_rate": 1.2760287412218824e-05, "loss": 0.4594, "step": 3751 }, { "epoch": 0.43, "learning_rate": 1.275672938197751e-05, "loss": 0.4848, "step": 3752 }, { "epoch": 0.43, "learning_rate": 1.2753170974002727e-05, "loss": 0.4542, "step": 3753 }, { "epoch": 0.43, "learning_rate": 1.2749612188782048e-05, "loss": 0.4643, "step": 3754 }, { "epoch": 0.43, "learning_rate": 1.2746053026803114e-05, "loss": 0.46, "step": 3755 }, { "epoch": 0.43, "learning_rate": 1.2742493488553606e-05, "loss": 0.4519, "step": 3756 }, { "epoch": 0.43, "learning_rate": 1.2738933574521262e-05, "loss": 0.4655, "step": 3757 }, { "epoch": 0.43, "learning_rate": 1.2735373285193867e-05, "loss": 0.4716, "step": 3758 }, { "epoch": 0.43, "learning_rate": 1.2731812621059262e-05, "loss": 0.469, "step": 3759 }, { "epoch": 0.43, "learning_rate": 1.2728251582605335e-05, "loss": 0.4608, "step": 3760 }, { "epoch": 0.43, "learning_rate": 1.2724690170320031e-05, "loss": 0.4635, "step": 3761 }, { "epoch": 0.43, "learning_rate": 1.2721128384691342e-05, "loss": 0.4552, "step": 3762 }, { "epoch": 0.43, "learning_rate": 1.2717566226207311e-05, "loss": 0.4805, "step": 3763 }, { "epoch": 0.43, "learning_rate": 1.2714003695356037e-05, "loss": 0.4595, "step": 3764 }, { "epoch": 0.43, "learning_rate": 1.2710440792625662e-05, "loss": 0.4617, "step": 3765 }, { "epoch": 0.43, "learning_rate": 1.2706877518504384e-05, "loss": 0.485, "step": 3766 }, { "epoch": 0.43, "learning_rate": 1.2703313873480451e-05, "loss": 0.462, "step": 3767 }, { "epoch": 0.43, "learning_rate": 1.2699749858042164e-05, "loss": 0.4743, "step": 3768 }, { "epoch": 0.43, "learning_rate": 1.269618547267787e-05, "loss": 0.4731, "step": 3769 }, { "epoch": 0.43, "learning_rate": 1.2692620717875972e-05, "loss": 0.4591, "step": 3770 }, { "epoch": 0.43, "learning_rate": 1.2689055594124919e-05, "loss": 0.4616, "step": 3771 }, { "epoch": 0.43, "learning_rate": 1.2685490101913214e-05, "loss": 0.4946, "step": 3772 }, { "epoch": 0.43, "learning_rate": 1.2681924241729409e-05, "loss": 0.4563, "step": 3773 }, { "epoch": 0.43, "learning_rate": 1.2678358014062104e-05, "loss": 0.4606, "step": 3774 }, { "epoch": 0.43, "learning_rate": 1.2674791419399956e-05, "loss": 0.4596, "step": 3775 }, { "epoch": 0.43, "learning_rate": 1.2671224458231664e-05, "loss": 0.5041, "step": 3776 }, { "epoch": 0.43, "learning_rate": 1.2667657131045983e-05, "loss": 0.4335, "step": 3777 }, { "epoch": 0.43, "learning_rate": 1.2664089438331716e-05, "loss": 0.4698, "step": 3778 }, { "epoch": 0.43, "learning_rate": 1.266052138057772e-05, "loss": 0.4479, "step": 3779 }, { "epoch": 0.43, "learning_rate": 1.2656952958272893e-05, "loss": 0.4608, "step": 3780 }, { "epoch": 0.43, "learning_rate": 1.2653384171906192e-05, "loss": 0.4745, "step": 3781 }, { "epoch": 0.43, "learning_rate": 1.264981502196662e-05, "loss": 0.4606, "step": 3782 }, { "epoch": 0.43, "learning_rate": 1.2646245508943227e-05, "loss": 0.47, "step": 3783 }, { "epoch": 0.43, "learning_rate": 1.2642675633325122e-05, "loss": 0.4923, "step": 3784 }, { "epoch": 0.43, "learning_rate": 1.2639105395601452e-05, "loss": 0.4503, "step": 3785 }, { "epoch": 0.43, "learning_rate": 1.2635534796261424e-05, "loss": 0.4632, "step": 3786 }, { "epoch": 0.43, "learning_rate": 1.2631963835794285e-05, "loss": 0.4807, "step": 3787 }, { "epoch": 0.43, "learning_rate": 1.2628392514689339e-05, "loss": 0.4647, "step": 3788 }, { "epoch": 0.43, "learning_rate": 1.2624820833435939e-05, "loss": 0.4696, "step": 3789 }, { "epoch": 0.43, "learning_rate": 1.262124879252348e-05, "loss": 0.4604, "step": 3790 }, { "epoch": 0.43, "learning_rate": 1.2617676392441419e-05, "loss": 0.4466, "step": 3791 }, { "epoch": 0.43, "learning_rate": 1.2614103633679244e-05, "loss": 0.4844, "step": 3792 }, { "epoch": 0.43, "learning_rate": 1.2610530516726506e-05, "loss": 0.4597, "step": 3793 }, { "epoch": 0.43, "learning_rate": 1.260695704207281e-05, "loss": 0.4664, "step": 3794 }, { "epoch": 0.43, "learning_rate": 1.2603383210207796e-05, "loss": 0.4714, "step": 3795 }, { "epoch": 0.43, "learning_rate": 1.2599809021621157e-05, "loss": 0.4559, "step": 3796 }, { "epoch": 0.43, "learning_rate": 1.2596234476802636e-05, "loss": 0.4551, "step": 3797 }, { "epoch": 0.43, "learning_rate": 1.2592659576242028e-05, "loss": 0.4842, "step": 3798 }, { "epoch": 0.43, "learning_rate": 1.2589084320429178e-05, "loss": 0.4632, "step": 3799 }, { "epoch": 0.43, "learning_rate": 1.2585508709853971e-05, "loss": 0.477, "step": 3800 }, { "epoch": 0.43, "learning_rate": 1.2581932745006343e-05, "loss": 0.4712, "step": 3801 }, { "epoch": 0.43, "learning_rate": 1.2578356426376283e-05, "loss": 0.4702, "step": 3802 }, { "epoch": 0.43, "learning_rate": 1.2574779754453831e-05, "loss": 0.4609, "step": 3803 }, { "epoch": 0.43, "learning_rate": 1.257120272972907e-05, "loss": 0.4698, "step": 3804 }, { "epoch": 0.43, "learning_rate": 1.2567625352692127e-05, "loss": 0.4681, "step": 3805 }, { "epoch": 0.43, "learning_rate": 1.2564047623833186e-05, "loss": 0.4557, "step": 3806 }, { "epoch": 0.44, "learning_rate": 1.2560469543642472e-05, "loss": 0.4728, "step": 3807 }, { "epoch": 0.44, "learning_rate": 1.255689111261027e-05, "loss": 0.4641, "step": 3808 }, { "epoch": 0.44, "learning_rate": 1.2553312331226896e-05, "loss": 0.4671, "step": 3809 }, { "epoch": 0.44, "learning_rate": 1.254973319998273e-05, "loss": 0.4723, "step": 3810 }, { "epoch": 0.44, "learning_rate": 1.2546153719368189e-05, "loss": 0.4556, "step": 3811 }, { "epoch": 0.44, "learning_rate": 1.2542573889873741e-05, "loss": 0.479, "step": 3812 }, { "epoch": 0.44, "learning_rate": 1.2538993711989906e-05, "loss": 0.4741, "step": 3813 }, { "epoch": 0.44, "learning_rate": 1.2535413186207247e-05, "loss": 0.4584, "step": 3814 }, { "epoch": 0.44, "learning_rate": 1.2531832313016374e-05, "loss": 0.4645, "step": 3815 }, { "epoch": 0.44, "learning_rate": 1.2528251092907948e-05, "loss": 0.4779, "step": 3816 }, { "epoch": 0.44, "learning_rate": 1.2524669526372674e-05, "loss": 0.4673, "step": 3817 }, { "epoch": 0.44, "learning_rate": 1.2521087613901313e-05, "loss": 0.4735, "step": 3818 }, { "epoch": 0.44, "learning_rate": 1.251750535598466e-05, "loss": 0.4649, "step": 3819 }, { "epoch": 0.44, "learning_rate": 1.2513922753113567e-05, "loss": 0.4772, "step": 3820 }, { "epoch": 0.44, "learning_rate": 1.2510339805778932e-05, "loss": 0.4602, "step": 3821 }, { "epoch": 0.44, "learning_rate": 1.2506756514471696e-05, "loss": 0.4734, "step": 3822 }, { "epoch": 0.44, "learning_rate": 1.2503172879682853e-05, "loss": 0.4635, "step": 3823 }, { "epoch": 0.44, "learning_rate": 1.2499588901903437e-05, "loss": 0.4662, "step": 3824 }, { "epoch": 0.44, "learning_rate": 1.2496004581624538e-05, "loss": 0.4722, "step": 3825 }, { "epoch": 0.44, "learning_rate": 1.2492419919337282e-05, "loss": 0.4521, "step": 3826 }, { "epoch": 0.44, "learning_rate": 1.2488834915532852e-05, "loss": 0.4681, "step": 3827 }, { "epoch": 0.44, "learning_rate": 1.2485249570702471e-05, "loss": 0.5047, "step": 3828 }, { "epoch": 0.44, "learning_rate": 1.2481663885337417e-05, "loss": 0.4595, "step": 3829 }, { "epoch": 0.44, "learning_rate": 1.2478077859929e-05, "loss": 0.4662, "step": 3830 }, { "epoch": 0.44, "learning_rate": 1.2474491494968593e-05, "loss": 0.4725, "step": 3831 }, { "epoch": 0.44, "learning_rate": 1.2470904790947605e-05, "loss": 0.4675, "step": 3832 }, { "epoch": 0.44, "learning_rate": 1.2467317748357493e-05, "loss": 0.4636, "step": 3833 }, { "epoch": 0.44, "learning_rate": 1.2463730367689768e-05, "loss": 0.4673, "step": 3834 }, { "epoch": 0.44, "learning_rate": 1.246014264943597e-05, "loss": 0.4526, "step": 3835 }, { "epoch": 0.44, "learning_rate": 1.2456554594087709e-05, "loss": 0.4888, "step": 3836 }, { "epoch": 0.44, "learning_rate": 1.245296620213662e-05, "loss": 0.4601, "step": 3837 }, { "epoch": 0.44, "learning_rate": 1.2449377474074398e-05, "loss": 0.4894, "step": 3838 }, { "epoch": 0.44, "learning_rate": 1.2445788410392778e-05, "loss": 0.4568, "step": 3839 }, { "epoch": 0.44, "learning_rate": 1.2442199011583538e-05, "loss": 0.4489, "step": 3840 }, { "epoch": 0.44, "learning_rate": 1.2438609278138509e-05, "loss": 0.4727, "step": 3841 }, { "epoch": 0.44, "learning_rate": 1.2435019210549564e-05, "loss": 0.4745, "step": 3842 }, { "epoch": 0.44, "learning_rate": 1.2431428809308625e-05, "loss": 0.4597, "step": 3843 }, { "epoch": 0.44, "learning_rate": 1.2427838074907654e-05, "loss": 0.4838, "step": 3844 }, { "epoch": 0.44, "learning_rate": 1.2424247007838659e-05, "loss": 0.4504, "step": 3845 }, { "epoch": 0.44, "learning_rate": 1.2420655608593701e-05, "loss": 0.4759, "step": 3846 }, { "epoch": 0.44, "learning_rate": 1.2417063877664883e-05, "loss": 0.4513, "step": 3847 }, { "epoch": 0.44, "learning_rate": 1.241347181554435e-05, "loss": 0.471, "step": 3848 }, { "epoch": 0.44, "learning_rate": 1.2409879422724293e-05, "loss": 0.4847, "step": 3849 }, { "epoch": 0.44, "learning_rate": 1.240628669969695e-05, "loss": 0.4829, "step": 3850 }, { "epoch": 0.44, "learning_rate": 1.2402693646954607e-05, "loss": 0.4523, "step": 3851 }, { "epoch": 0.44, "learning_rate": 1.2399100264989593e-05, "loss": 0.4763, "step": 3852 }, { "epoch": 0.44, "learning_rate": 1.2395506554294281e-05, "loss": 0.4629, "step": 3853 }, { "epoch": 0.44, "learning_rate": 1.2391912515361085e-05, "loss": 0.4689, "step": 3854 }, { "epoch": 0.44, "learning_rate": 1.2388318148682474e-05, "loss": 0.459, "step": 3855 }, { "epoch": 0.44, "learning_rate": 1.2384723454750957e-05, "loss": 0.4638, "step": 3856 }, { "epoch": 0.44, "learning_rate": 1.2381128434059082e-05, "loss": 0.4496, "step": 3857 }, { "epoch": 0.44, "learning_rate": 1.2377533087099451e-05, "loss": 0.4754, "step": 3858 }, { "epoch": 0.44, "learning_rate": 1.2373937414364703e-05, "loss": 0.4502, "step": 3859 }, { "epoch": 0.44, "learning_rate": 1.237034141634753e-05, "loss": 0.4675, "step": 3860 }, { "epoch": 0.44, "learning_rate": 1.2366745093540667e-05, "loss": 0.4682, "step": 3861 }, { "epoch": 0.44, "learning_rate": 1.2363148446436882e-05, "loss": 0.4683, "step": 3862 }, { "epoch": 0.44, "learning_rate": 1.2359551475529e-05, "loss": 0.4558, "step": 3863 }, { "epoch": 0.44, "learning_rate": 1.2355954181309883e-05, "loss": 0.4749, "step": 3864 }, { "epoch": 0.44, "learning_rate": 1.235235656427245e-05, "loss": 0.4658, "step": 3865 }, { "epoch": 0.44, "learning_rate": 1.2348758624909644e-05, "loss": 0.4681, "step": 3866 }, { "epoch": 0.44, "learning_rate": 1.2345160363714471e-05, "loss": 0.4694, "step": 3867 }, { "epoch": 0.44, "learning_rate": 1.2341561781179965e-05, "loss": 0.4718, "step": 3868 }, { "epoch": 0.44, "learning_rate": 1.233796287779922e-05, "loss": 0.4808, "step": 3869 }, { "epoch": 0.44, "learning_rate": 1.2334363654065363e-05, "loss": 0.4671, "step": 3870 }, { "epoch": 0.44, "learning_rate": 1.2330764110471567e-05, "loss": 0.4458, "step": 3871 }, { "epoch": 0.44, "learning_rate": 1.2327164247511051e-05, "loss": 0.4809, "step": 3872 }, { "epoch": 0.44, "learning_rate": 1.2323564065677078e-05, "loss": 0.4554, "step": 3873 }, { "epoch": 0.44, "learning_rate": 1.2319963565462949e-05, "loss": 0.4595, "step": 3874 }, { "epoch": 0.44, "learning_rate": 1.2316362747362019e-05, "loss": 0.4644, "step": 3875 }, { "epoch": 0.44, "learning_rate": 1.2312761611867673e-05, "loss": 0.463, "step": 3876 }, { "epoch": 0.44, "learning_rate": 1.2309160159473354e-05, "loss": 0.4827, "step": 3877 }, { "epoch": 0.44, "learning_rate": 1.2305558390672539e-05, "loss": 0.4786, "step": 3878 }, { "epoch": 0.44, "learning_rate": 1.2301956305958746e-05, "loss": 0.4691, "step": 3879 }, { "epoch": 0.44, "learning_rate": 1.2298353905825549e-05, "loss": 0.4597, "step": 3880 }, { "epoch": 0.44, "learning_rate": 1.2294751190766552e-05, "loss": 0.4655, "step": 3881 }, { "epoch": 0.44, "learning_rate": 1.229114816127541e-05, "loss": 0.4744, "step": 3882 }, { "epoch": 0.44, "learning_rate": 1.2287544817845817e-05, "loss": 0.4498, "step": 3883 }, { "epoch": 0.44, "learning_rate": 1.2283941160971512e-05, "loss": 0.4816, "step": 3884 }, { "epoch": 0.44, "learning_rate": 1.2280337191146276e-05, "loss": 0.4777, "step": 3885 }, { "epoch": 0.44, "learning_rate": 1.2276732908863933e-05, "loss": 0.4736, "step": 3886 }, { "epoch": 0.44, "learning_rate": 1.2273128314618353e-05, "loss": 0.462, "step": 3887 }, { "epoch": 0.44, "learning_rate": 1.226952340890344e-05, "loss": 0.4851, "step": 3888 }, { "epoch": 0.44, "learning_rate": 1.2265918192213153e-05, "loss": 0.4576, "step": 3889 }, { "epoch": 0.44, "learning_rate": 1.2262312665041482e-05, "loss": 0.4893, "step": 3890 }, { "epoch": 0.44, "learning_rate": 1.2258706827882472e-05, "loss": 0.462, "step": 3891 }, { "epoch": 0.44, "learning_rate": 1.2255100681230192e-05, "loss": 0.4632, "step": 3892 }, { "epoch": 0.44, "learning_rate": 1.2251494225578775e-05, "loss": 0.4544, "step": 3893 }, { "epoch": 0.45, "learning_rate": 1.224788746142238e-05, "loss": 0.4882, "step": 3894 }, { "epoch": 0.45, "learning_rate": 1.2244280389255218e-05, "loss": 0.4637, "step": 3895 }, { "epoch": 0.45, "learning_rate": 1.2240673009571536e-05, "loss": 0.459, "step": 3896 }, { "epoch": 0.45, "learning_rate": 1.2237065322865625e-05, "loss": 0.4563, "step": 3897 }, { "epoch": 0.45, "learning_rate": 1.223345732963182e-05, "loss": 0.4665, "step": 3898 }, { "epoch": 0.45, "learning_rate": 1.2229849030364496e-05, "loss": 0.4574, "step": 3899 }, { "epoch": 0.45, "learning_rate": 1.2226240425558071e-05, "loss": 0.4701, "step": 3900 }, { "epoch": 0.45, "learning_rate": 1.2222631515707005e-05, "loss": 0.4649, "step": 3901 }, { "epoch": 0.45, "learning_rate": 1.2219022301305796e-05, "loss": 0.4686, "step": 3902 }, { "epoch": 0.45, "learning_rate": 1.2215412782848993e-05, "loss": 0.4741, "step": 3903 }, { "epoch": 0.45, "learning_rate": 1.2211802960831176e-05, "loss": 0.4629, "step": 3904 }, { "epoch": 0.45, "learning_rate": 1.2208192835746973e-05, "loss": 0.4678, "step": 3905 }, { "epoch": 0.45, "learning_rate": 1.2204582408091047e-05, "loss": 0.4732, "step": 3906 }, { "epoch": 0.45, "learning_rate": 1.2200971678358113e-05, "loss": 0.4798, "step": 3907 }, { "epoch": 0.45, "learning_rate": 1.2197360647042922e-05, "loss": 0.4674, "step": 3908 }, { "epoch": 0.45, "learning_rate": 1.2193749314640264e-05, "loss": 0.4708, "step": 3909 }, { "epoch": 0.45, "learning_rate": 1.2190137681644968e-05, "loss": 0.4884, "step": 3910 }, { "epoch": 0.45, "learning_rate": 1.2186525748551914e-05, "loss": 0.468, "step": 3911 }, { "epoch": 0.45, "learning_rate": 1.2182913515856016e-05, "loss": 0.4619, "step": 3912 }, { "epoch": 0.45, "learning_rate": 1.2179300984052233e-05, "loss": 0.4604, "step": 3913 }, { "epoch": 0.45, "learning_rate": 1.217568815363556e-05, "loss": 0.4674, "step": 3914 }, { "epoch": 0.45, "learning_rate": 1.2172075025101032e-05, "loss": 0.4838, "step": 3915 }, { "epoch": 0.45, "learning_rate": 1.2168461598943728e-05, "loss": 0.4492, "step": 3916 }, { "epoch": 0.45, "learning_rate": 1.2164847875658776e-05, "loss": 0.4636, "step": 3917 }, { "epoch": 0.45, "learning_rate": 1.2161233855741332e-05, "loss": 0.4594, "step": 3918 }, { "epoch": 0.45, "learning_rate": 1.2157619539686597e-05, "loss": 0.488, "step": 3919 }, { "epoch": 0.45, "learning_rate": 1.2154004927989815e-05, "loss": 0.4618, "step": 3920 }, { "epoch": 0.45, "learning_rate": 1.2150390021146263e-05, "loss": 0.4698, "step": 3921 }, { "epoch": 0.45, "learning_rate": 1.2146774819651275e-05, "loss": 0.4638, "step": 3922 }, { "epoch": 0.45, "learning_rate": 1.2143159324000204e-05, "loss": 0.4549, "step": 3923 }, { "epoch": 0.45, "learning_rate": 1.2139543534688456e-05, "loss": 0.4666, "step": 3924 }, { "epoch": 0.45, "learning_rate": 1.2135927452211477e-05, "loss": 0.4641, "step": 3925 }, { "epoch": 0.45, "learning_rate": 1.2132311077064749e-05, "loss": 0.4634, "step": 3926 }, { "epoch": 0.45, "learning_rate": 1.2128694409743797e-05, "loss": 0.4843, "step": 3927 }, { "epoch": 0.45, "learning_rate": 1.2125077450744187e-05, "loss": 0.4659, "step": 3928 }, { "epoch": 0.45, "learning_rate": 1.2121460200561521e-05, "loss": 0.4573, "step": 3929 }, { "epoch": 0.45, "learning_rate": 1.2117842659691444e-05, "loss": 0.4587, "step": 3930 }, { "epoch": 0.45, "learning_rate": 1.2114224828629638e-05, "loss": 0.467, "step": 3931 }, { "epoch": 0.45, "learning_rate": 1.2110606707871828e-05, "loss": 0.4531, "step": 3932 }, { "epoch": 0.45, "learning_rate": 1.2106988297913778e-05, "loss": 0.4764, "step": 3933 }, { "epoch": 0.45, "learning_rate": 1.2103369599251289e-05, "loss": 0.4769, "step": 3934 }, { "epoch": 0.45, "learning_rate": 1.2099750612380205e-05, "loss": 0.4911, "step": 3935 }, { "epoch": 0.45, "learning_rate": 1.2096131337796408e-05, "loss": 0.4438, "step": 3936 }, { "epoch": 0.45, "learning_rate": 1.2092511775995821e-05, "loss": 0.4926, "step": 3937 }, { "epoch": 0.45, "learning_rate": 1.20888919274744e-05, "loss": 0.4568, "step": 3938 }, { "epoch": 0.45, "learning_rate": 1.208527179272815e-05, "loss": 0.4464, "step": 3939 }, { "epoch": 0.45, "learning_rate": 1.2081651372253107e-05, "loss": 0.4697, "step": 3940 }, { "epoch": 0.45, "learning_rate": 1.2078030666545351e-05, "loss": 0.4728, "step": 3941 }, { "epoch": 0.45, "learning_rate": 1.2074409676101e-05, "loss": 0.4593, "step": 3942 }, { "epoch": 0.45, "learning_rate": 1.2070788401416209e-05, "loss": 0.4709, "step": 3943 }, { "epoch": 0.45, "learning_rate": 1.2067166842987175e-05, "loss": 0.4667, "step": 3944 }, { "epoch": 0.45, "learning_rate": 1.206354500131013e-05, "loss": 0.4728, "step": 3945 }, { "epoch": 0.45, "learning_rate": 1.205992287688135e-05, "loss": 0.4962, "step": 3946 }, { "epoch": 0.45, "learning_rate": 1.2056300470197144e-05, "loss": 0.4613, "step": 3947 }, { "epoch": 0.45, "learning_rate": 1.2052677781753869e-05, "loss": 0.4539, "step": 3948 }, { "epoch": 0.45, "learning_rate": 1.2049054812047905e-05, "loss": 0.4602, "step": 3949 }, { "epoch": 0.45, "learning_rate": 1.2045431561575685e-05, "loss": 0.4621, "step": 3950 }, { "epoch": 0.45, "learning_rate": 1.2041808030833675e-05, "loss": 0.4672, "step": 3951 }, { "epoch": 0.45, "learning_rate": 1.2038184220318381e-05, "loss": 0.4647, "step": 3952 }, { "epoch": 0.45, "learning_rate": 1.2034560130526341e-05, "loss": 0.4773, "step": 3953 }, { "epoch": 0.45, "learning_rate": 1.2030935761954137e-05, "loss": 0.4605, "step": 3954 }, { "epoch": 0.45, "learning_rate": 1.2027311115098395e-05, "loss": 0.4847, "step": 3955 }, { "epoch": 0.45, "learning_rate": 1.2023686190455766e-05, "loss": 0.4613, "step": 3956 }, { "epoch": 0.45, "learning_rate": 1.202006098852295e-05, "loss": 0.4723, "step": 3957 }, { "epoch": 0.45, "learning_rate": 1.2016435509796677e-05, "loss": 0.4552, "step": 3958 }, { "epoch": 0.45, "learning_rate": 1.2012809754773718e-05, "loss": 0.4701, "step": 3959 }, { "epoch": 0.45, "learning_rate": 1.2009183723950886e-05, "loss": 0.4679, "step": 3960 }, { "epoch": 0.45, "learning_rate": 1.2005557417825029e-05, "loss": 0.4634, "step": 3961 }, { "epoch": 0.45, "learning_rate": 1.2001930836893026e-05, "loss": 0.4503, "step": 3962 }, { "epoch": 0.45, "learning_rate": 1.1998303981651804e-05, "loss": 0.4864, "step": 3963 }, { "epoch": 0.45, "learning_rate": 1.199467685259832e-05, "loss": 0.4726, "step": 3964 }, { "epoch": 0.45, "learning_rate": 1.1991049450229577e-05, "loss": 0.4478, "step": 3965 }, { "epoch": 0.45, "learning_rate": 1.1987421775042605e-05, "loss": 0.4787, "step": 3966 }, { "epoch": 0.45, "learning_rate": 1.1983793827534477e-05, "loss": 0.4795, "step": 3967 }, { "epoch": 0.45, "learning_rate": 1.1980165608202303e-05, "loss": 0.4697, "step": 3968 }, { "epoch": 0.45, "learning_rate": 1.1976537117543234e-05, "loss": 0.4527, "step": 3969 }, { "epoch": 0.45, "learning_rate": 1.1972908356054455e-05, "loss": 0.4764, "step": 3970 }, { "epoch": 0.45, "learning_rate": 1.1969279324233179e-05, "loss": 0.4666, "step": 3971 }, { "epoch": 0.45, "learning_rate": 1.1965650022576672e-05, "loss": 0.4536, "step": 3972 }, { "epoch": 0.45, "learning_rate": 1.196202045158222e-05, "loss": 0.4626, "step": 3973 }, { "epoch": 0.45, "learning_rate": 1.1958390611747167e-05, "loss": 0.471, "step": 3974 }, { "epoch": 0.45, "learning_rate": 1.1954760503568878e-05, "loss": 0.4596, "step": 3975 }, { "epoch": 0.45, "learning_rate": 1.1951130127544756e-05, "loss": 0.4595, "step": 3976 }, { "epoch": 0.45, "learning_rate": 1.1947499484172245e-05, "loss": 0.4803, "step": 3977 }, { "epoch": 0.45, "learning_rate": 1.1943868573948825e-05, "loss": 0.4693, "step": 3978 }, { "epoch": 0.45, "learning_rate": 1.194023739737201e-05, "loss": 0.4819, "step": 3979 }, { "epoch": 0.45, "learning_rate": 1.1936605954939355e-05, "loss": 0.4549, "step": 3980 }, { "epoch": 0.45, "learning_rate": 1.1932974247148445e-05, "loss": 0.4593, "step": 3981 }, { "epoch": 0.46, "learning_rate": 1.192934227449691e-05, "loss": 0.4699, "step": 3982 }, { "epoch": 0.46, "learning_rate": 1.1925710037482405e-05, "loss": 0.4489, "step": 3983 }, { "epoch": 0.46, "learning_rate": 1.1922077536602634e-05, "loss": 0.4618, "step": 3984 }, { "epoch": 0.46, "learning_rate": 1.1918444772355329e-05, "loss": 0.4802, "step": 3985 }, { "epoch": 0.46, "learning_rate": 1.1914811745238256e-05, "loss": 0.4796, "step": 3986 }, { "epoch": 0.46, "learning_rate": 1.1911178455749223e-05, "loss": 0.4778, "step": 3987 }, { "epoch": 0.46, "learning_rate": 1.1907544904386074e-05, "loss": 0.4448, "step": 3988 }, { "epoch": 0.46, "learning_rate": 1.1903911091646684e-05, "loss": 0.4815, "step": 3989 }, { "epoch": 0.46, "learning_rate": 1.190027701802897e-05, "loss": 0.4605, "step": 3990 }, { "epoch": 0.46, "learning_rate": 1.1896642684030874e-05, "loss": 0.4692, "step": 3991 }, { "epoch": 0.46, "learning_rate": 1.1893008090150389e-05, "loss": 0.4576, "step": 3992 }, { "epoch": 0.46, "learning_rate": 1.1889373236885531e-05, "loss": 0.472, "step": 3993 }, { "epoch": 0.46, "learning_rate": 1.1885738124734359e-05, "loss": 0.4549, "step": 3994 }, { "epoch": 0.46, "learning_rate": 1.188210275419496e-05, "loss": 0.481, "step": 3995 }, { "epoch": 0.46, "learning_rate": 1.1878467125765464e-05, "loss": 0.449, "step": 3996 }, { "epoch": 0.46, "learning_rate": 1.1874831239944034e-05, "loss": 0.4738, "step": 3997 }, { "epoch": 0.46, "learning_rate": 1.1871195097228864e-05, "loss": 0.4507, "step": 3998 }, { "epoch": 0.46, "learning_rate": 1.1867558698118192e-05, "loss": 0.4777, "step": 3999 }, { "epoch": 0.46, "learning_rate": 1.1863922043110282e-05, "loss": 0.4692, "step": 4000 }, { "epoch": 0.46, "learning_rate": 1.1860285132703435e-05, "loss": 0.474, "step": 4001 }, { "epoch": 0.46, "learning_rate": 1.1856647967395995e-05, "loss": 0.462, "step": 4002 }, { "epoch": 0.46, "learning_rate": 1.185301054768633e-05, "loss": 0.4657, "step": 4003 }, { "epoch": 0.46, "learning_rate": 1.1849372874072852e-05, "loss": 0.4854, "step": 4004 }, { "epoch": 0.46, "learning_rate": 1.1845734947054e-05, "loss": 0.4589, "step": 4005 }, { "epoch": 0.46, "learning_rate": 1.1842096767128249e-05, "loss": 0.4663, "step": 4006 }, { "epoch": 0.46, "learning_rate": 1.1838458334794116e-05, "loss": 0.4764, "step": 4007 }, { "epoch": 0.46, "learning_rate": 1.1834819650550144e-05, "loss": 0.4485, "step": 4008 }, { "epoch": 0.46, "learning_rate": 1.1831180714894918e-05, "loss": 0.4674, "step": 4009 }, { "epoch": 0.46, "learning_rate": 1.1827541528327052e-05, "loss": 0.4603, "step": 4010 }, { "epoch": 0.46, "learning_rate": 1.182390209134519e-05, "loss": 0.4521, "step": 4011 }, { "epoch": 0.46, "learning_rate": 1.1820262404448023e-05, "loss": 0.4839, "step": 4012 }, { "epoch": 0.46, "learning_rate": 1.181662246813427e-05, "loss": 0.4953, "step": 4013 }, { "epoch": 0.46, "learning_rate": 1.1812982282902676e-05, "loss": 0.4508, "step": 4014 }, { "epoch": 0.46, "learning_rate": 1.1809341849252034e-05, "loss": 0.4796, "step": 4015 }, { "epoch": 0.46, "learning_rate": 1.180570116768116e-05, "loss": 0.4567, "step": 4016 }, { "epoch": 0.46, "learning_rate": 1.1802060238688915e-05, "loss": 0.4681, "step": 4017 }, { "epoch": 0.46, "learning_rate": 1.1798419062774185e-05, "loss": 0.4736, "step": 4018 }, { "epoch": 0.46, "learning_rate": 1.179477764043589e-05, "loss": 0.4584, "step": 4019 }, { "epoch": 0.46, "learning_rate": 1.1791135972172989e-05, "loss": 0.4717, "step": 4020 }, { "epoch": 0.46, "learning_rate": 1.1787494058484468e-05, "loss": 0.4796, "step": 4021 }, { "epoch": 0.46, "learning_rate": 1.1783851899869357e-05, "loss": 0.4622, "step": 4022 }, { "epoch": 0.46, "learning_rate": 1.1780209496826707e-05, "loss": 0.4661, "step": 4023 }, { "epoch": 0.46, "learning_rate": 1.177656684985561e-05, "loss": 0.4547, "step": 4024 }, { "epoch": 0.46, "learning_rate": 1.1772923959455188e-05, "loss": 0.4589, "step": 4025 }, { "epoch": 0.46, "learning_rate": 1.1769280826124604e-05, "loss": 0.4461, "step": 4026 }, { "epoch": 0.46, "learning_rate": 1.1765637450363048e-05, "loss": 0.479, "step": 4027 }, { "epoch": 0.46, "learning_rate": 1.176199383266974e-05, "loss": 0.475, "step": 4028 }, { "epoch": 0.46, "learning_rate": 1.1758349973543936e-05, "loss": 0.485, "step": 4029 }, { "epoch": 0.46, "learning_rate": 1.1754705873484929e-05, "loss": 0.4537, "step": 4030 }, { "epoch": 0.46, "learning_rate": 1.1751061532992045e-05, "loss": 0.4889, "step": 4031 }, { "epoch": 0.46, "learning_rate": 1.1747416952564632e-05, "loss": 0.4695, "step": 4032 }, { "epoch": 0.46, "learning_rate": 1.1743772132702086e-05, "loss": 0.4752, "step": 4033 }, { "epoch": 0.46, "learning_rate": 1.1740127073903826e-05, "loss": 0.4519, "step": 4034 }, { "epoch": 0.46, "learning_rate": 1.1736481776669307e-05, "loss": 0.4603, "step": 4035 }, { "epoch": 0.46, "learning_rate": 1.1732836241498013e-05, "loss": 0.4767, "step": 4036 }, { "epoch": 0.46, "learning_rate": 1.1729190468889466e-05, "loss": 0.4883, "step": 4037 }, { "epoch": 0.46, "learning_rate": 1.1725544459343221e-05, "loss": 0.4877, "step": 4038 }, { "epoch": 0.46, "learning_rate": 1.172189821335886e-05, "loss": 0.4644, "step": 4039 }, { "epoch": 0.46, "learning_rate": 1.1718251731436001e-05, "loss": 0.4534, "step": 4040 }, { "epoch": 0.46, "learning_rate": 1.1714605014074291e-05, "loss": 0.4697, "step": 4041 }, { "epoch": 0.46, "learning_rate": 1.1710958061773413e-05, "loss": 0.4632, "step": 4042 }, { "epoch": 0.46, "learning_rate": 1.1707310875033085e-05, "loss": 0.4561, "step": 4043 }, { "epoch": 0.46, "learning_rate": 1.1703663454353045e-05, "loss": 0.4752, "step": 4044 }, { "epoch": 0.46, "learning_rate": 1.1700015800233078e-05, "loss": 0.4879, "step": 4045 }, { "epoch": 0.46, "learning_rate": 1.169636791317299e-05, "loss": 0.4552, "step": 4046 }, { "epoch": 0.46, "learning_rate": 1.1692719793672627e-05, "loss": 0.4641, "step": 4047 }, { "epoch": 0.46, "learning_rate": 1.1689071442231858e-05, "loss": 0.4615, "step": 4048 }, { "epoch": 0.46, "learning_rate": 1.1685422859350592e-05, "loss": 0.4859, "step": 4049 }, { "epoch": 0.46, "learning_rate": 1.1681774045528764e-05, "loss": 0.4727, "step": 4050 }, { "epoch": 0.46, "learning_rate": 1.1678125001266347e-05, "loss": 0.4682, "step": 4051 }, { "epoch": 0.46, "learning_rate": 1.1674475727063337e-05, "loss": 0.4597, "step": 4052 }, { "epoch": 0.46, "learning_rate": 1.1670826223419766e-05, "loss": 0.4775, "step": 4053 }, { "epoch": 0.46, "learning_rate": 1.1667176490835701e-05, "loss": 0.4741, "step": 4054 }, { "epoch": 0.46, "learning_rate": 1.1663526529811235e-05, "loss": 0.4678, "step": 4055 }, { "epoch": 0.46, "learning_rate": 1.1659876340846494e-05, "loss": 0.4658, "step": 4056 }, { "epoch": 0.46, "learning_rate": 1.165622592444164e-05, "loss": 0.4533, "step": 4057 }, { "epoch": 0.46, "learning_rate": 1.165257528109685e-05, "loss": 0.4822, "step": 4058 }, { "epoch": 0.46, "learning_rate": 1.1648924411312354e-05, "loss": 0.4722, "step": 4059 }, { "epoch": 0.46, "learning_rate": 1.1645273315588399e-05, "loss": 0.4607, "step": 4060 }, { "epoch": 0.46, "learning_rate": 1.164162199442527e-05, "loss": 0.4798, "step": 4061 }, { "epoch": 0.46, "learning_rate": 1.1637970448323274e-05, "loss": 0.4758, "step": 4062 }, { "epoch": 0.46, "learning_rate": 1.1634318677782755e-05, "loss": 0.4617, "step": 4063 }, { "epoch": 0.46, "learning_rate": 1.163066668330409e-05, "loss": 0.467, "step": 4064 }, { "epoch": 0.46, "learning_rate": 1.1627014465387685e-05, "loss": 0.4489, "step": 4065 }, { "epoch": 0.46, "learning_rate": 1.1623362024533974e-05, "loss": 0.4678, "step": 4066 }, { "epoch": 0.46, "learning_rate": 1.161970936124342e-05, "loss": 0.4925, "step": 4067 }, { "epoch": 0.46, "learning_rate": 1.1616056476016521e-05, "loss": 0.4605, "step": 4068 }, { "epoch": 0.47, "learning_rate": 1.1612403369353806e-05, "loss": 0.4645, "step": 4069 }, { "epoch": 0.47, "learning_rate": 1.1608750041755832e-05, "loss": 0.4682, "step": 4070 }, { "epoch": 0.47, "learning_rate": 1.1605096493723183e-05, "loss": 0.4891, "step": 4071 }, { "epoch": 0.47, "learning_rate": 1.1601442725756478e-05, "loss": 0.4667, "step": 4072 }, { "epoch": 0.47, "learning_rate": 1.1597788738356365e-05, "loss": 0.4829, "step": 4073 }, { "epoch": 0.47, "learning_rate": 1.1594134532023525e-05, "loss": 0.4345, "step": 4074 }, { "epoch": 0.47, "learning_rate": 1.1590480107258663e-05, "loss": 0.4448, "step": 4075 }, { "epoch": 0.47, "learning_rate": 1.1586825464562515e-05, "loss": 0.4806, "step": 4076 }, { "epoch": 0.47, "learning_rate": 1.1583170604435851e-05, "loss": 0.4897, "step": 4077 }, { "epoch": 0.47, "learning_rate": 1.1579515527379468e-05, "loss": 0.4704, "step": 4078 }, { "epoch": 0.47, "learning_rate": 1.1575860233894195e-05, "loss": 0.4678, "step": 4079 }, { "epoch": 0.47, "learning_rate": 1.1572204724480887e-05, "loss": 0.4891, "step": 4080 }, { "epoch": 0.47, "learning_rate": 1.1568548999640428e-05, "loss": 0.4619, "step": 4081 }, { "epoch": 0.47, "learning_rate": 1.1564893059873734e-05, "loss": 0.4855, "step": 4082 }, { "epoch": 0.47, "learning_rate": 1.1561236905681761e-05, "loss": 0.4489, "step": 4083 }, { "epoch": 0.47, "learning_rate": 1.155758053756547e-05, "loss": 0.4747, "step": 4084 }, { "epoch": 0.47, "learning_rate": 1.1553923956025871e-05, "loss": 0.4877, "step": 4085 }, { "epoch": 0.47, "learning_rate": 1.1550267161563998e-05, "loss": 0.4616, "step": 4086 }, { "epoch": 0.47, "learning_rate": 1.1546610154680908e-05, "loss": 0.4657, "step": 4087 }, { "epoch": 0.47, "learning_rate": 1.1542952935877703e-05, "loss": 0.4554, "step": 4088 }, { "epoch": 0.47, "learning_rate": 1.1539295505655494e-05, "loss": 0.4621, "step": 4089 }, { "epoch": 0.47, "learning_rate": 1.1535637864515436e-05, "loss": 0.4696, "step": 4090 }, { "epoch": 0.47, "learning_rate": 1.1531980012958706e-05, "loss": 0.4821, "step": 4091 }, { "epoch": 0.47, "learning_rate": 1.152832195148651e-05, "loss": 0.4452, "step": 4092 }, { "epoch": 0.47, "learning_rate": 1.1524663680600083e-05, "loss": 0.5015, "step": 4093 }, { "epoch": 0.47, "learning_rate": 1.1521005200800694e-05, "loss": 0.4502, "step": 4094 }, { "epoch": 0.47, "learning_rate": 1.1517346512589635e-05, "loss": 0.4993, "step": 4095 }, { "epoch": 0.47, "learning_rate": 1.1513687616468225e-05, "loss": 0.4516, "step": 4096 }, { "epoch": 0.47, "learning_rate": 1.1510028512937818e-05, "loss": 0.4495, "step": 4097 }, { "epoch": 0.47, "learning_rate": 1.1506369202499791e-05, "loss": 0.4643, "step": 4098 }, { "epoch": 0.47, "learning_rate": 1.1502709685655553e-05, "loss": 0.474, "step": 4099 }, { "epoch": 0.47, "learning_rate": 1.149904996290654e-05, "loss": 0.448, "step": 4100 }, { "epoch": 0.47, "learning_rate": 1.149539003475421e-05, "loss": 0.4667, "step": 4101 }, { "epoch": 0.47, "learning_rate": 1.1491729901700062e-05, "loss": 0.4557, "step": 4102 }, { "epoch": 0.47, "learning_rate": 1.148806956424561e-05, "loss": 0.4826, "step": 4103 }, { "epoch": 0.47, "learning_rate": 1.1484409022892406e-05, "loss": 0.4517, "step": 4104 }, { "epoch": 0.47, "learning_rate": 1.1480748278142025e-05, "loss": 0.4756, "step": 4105 }, { "epoch": 0.47, "learning_rate": 1.1477087330496071e-05, "loss": 0.4744, "step": 4106 }, { "epoch": 0.47, "learning_rate": 1.1473426180456174e-05, "loss": 0.4785, "step": 4107 }, { "epoch": 0.47, "learning_rate": 1.1469764828523995e-05, "loss": 0.4586, "step": 4108 }, { "epoch": 0.47, "learning_rate": 1.146610327520122e-05, "loss": 0.4743, "step": 4109 }, { "epoch": 0.47, "learning_rate": 1.1462441520989565e-05, "loss": 0.4627, "step": 4110 }, { "epoch": 0.47, "learning_rate": 1.1458779566390768e-05, "loss": 0.4851, "step": 4111 }, { "epoch": 0.47, "learning_rate": 1.1455117411906604e-05, "loss": 0.4588, "step": 4112 }, { "epoch": 0.47, "learning_rate": 1.1451455058038864e-05, "loss": 0.47, "step": 4113 }, { "epoch": 0.47, "learning_rate": 1.1447792505289384e-05, "loss": 0.4498, "step": 4114 }, { "epoch": 0.47, "learning_rate": 1.1444129754159998e-05, "loss": 0.4372, "step": 4115 }, { "epoch": 0.47, "learning_rate": 1.1440466805152596e-05, "loss": 0.4844, "step": 4116 }, { "epoch": 0.47, "learning_rate": 1.1436803658769082e-05, "loss": 0.4632, "step": 4117 }, { "epoch": 0.47, "learning_rate": 1.1433140315511392e-05, "loss": 0.4676, "step": 4118 }, { "epoch": 0.47, "learning_rate": 1.142947677588148e-05, "loss": 0.4622, "step": 4119 }, { "epoch": 0.47, "learning_rate": 1.1425813040381332e-05, "loss": 0.4423, "step": 4120 }, { "epoch": 0.47, "learning_rate": 1.1422149109512967e-05, "loss": 0.4961, "step": 4121 }, { "epoch": 0.47, "learning_rate": 1.1418484983778421e-05, "loss": 0.4723, "step": 4122 }, { "epoch": 0.47, "learning_rate": 1.1414820663679768e-05, "loss": 0.486, "step": 4123 }, { "epoch": 0.47, "learning_rate": 1.1411156149719094e-05, "loss": 0.4641, "step": 4124 }, { "epoch": 0.47, "learning_rate": 1.1407491442398518e-05, "loss": 0.4745, "step": 4125 }, { "epoch": 0.47, "learning_rate": 1.1403826542220193e-05, "loss": 0.4447, "step": 4126 }, { "epoch": 0.47, "learning_rate": 1.1400161449686293e-05, "loss": 0.4544, "step": 4127 }, { "epoch": 0.47, "learning_rate": 1.139649616529901e-05, "loss": 0.4771, "step": 4128 }, { "epoch": 0.47, "learning_rate": 1.1392830689560577e-05, "loss": 0.4845, "step": 4129 }, { "epoch": 0.47, "learning_rate": 1.1389165022973238e-05, "loss": 0.4613, "step": 4130 }, { "epoch": 0.47, "learning_rate": 1.1385499166039281e-05, "loss": 0.4566, "step": 4131 }, { "epoch": 0.47, "learning_rate": 1.1381833119261003e-05, "loss": 0.4597, "step": 4132 }, { "epoch": 0.47, "learning_rate": 1.1378166883140738e-05, "loss": 0.4653, "step": 4133 }, { "epoch": 0.47, "learning_rate": 1.1374500458180839e-05, "loss": 0.4702, "step": 4134 }, { "epoch": 0.47, "learning_rate": 1.137083384488369e-05, "loss": 0.4467, "step": 4135 }, { "epoch": 0.47, "learning_rate": 1.1367167043751701e-05, "loss": 0.4668, "step": 4136 }, { "epoch": 0.47, "learning_rate": 1.1363500055287301e-05, "loss": 0.4543, "step": 4137 }, { "epoch": 0.47, "learning_rate": 1.1359832879992956e-05, "loss": 0.4653, "step": 4138 }, { "epoch": 0.47, "learning_rate": 1.1356165518371142e-05, "loss": 0.4749, "step": 4139 }, { "epoch": 0.47, "learning_rate": 1.1352497970924376e-05, "loss": 0.4748, "step": 4140 }, { "epoch": 0.47, "learning_rate": 1.1348830238155191e-05, "loss": 0.4532, "step": 4141 }, { "epoch": 0.47, "learning_rate": 1.134516232056615e-05, "loss": 0.4458, "step": 4142 }, { "epoch": 0.47, "learning_rate": 1.134149421865984e-05, "loss": 0.4781, "step": 4143 }, { "epoch": 0.47, "learning_rate": 1.1337825932938866e-05, "loss": 0.4488, "step": 4144 }, { "epoch": 0.47, "learning_rate": 1.1334157463905876e-05, "loss": 0.4605, "step": 4145 }, { "epoch": 0.47, "learning_rate": 1.1330488812063526e-05, "loss": 0.4605, "step": 4146 }, { "epoch": 0.47, "learning_rate": 1.1326819977914503e-05, "loss": 0.4966, "step": 4147 }, { "epoch": 0.47, "learning_rate": 1.132315096196152e-05, "loss": 0.4677, "step": 4148 }, { "epoch": 0.47, "learning_rate": 1.1319481764707313e-05, "loss": 0.4461, "step": 4149 }, { "epoch": 0.47, "learning_rate": 1.131581238665465e-05, "loss": 0.4615, "step": 4150 }, { "epoch": 0.47, "learning_rate": 1.1312142828306309e-05, "loss": 0.4617, "step": 4151 }, { "epoch": 0.47, "learning_rate": 1.1308473090165107e-05, "loss": 0.4534, "step": 4152 }, { "epoch": 0.47, "learning_rate": 1.1304803172733878e-05, "loss": 0.4575, "step": 4153 }, { "epoch": 0.47, "learning_rate": 1.1301133076515482e-05, "loss": 0.463, "step": 4154 }, { "epoch": 0.47, "learning_rate": 1.1297462802012806e-05, "loss": 0.4876, "step": 4155 }, { "epoch": 0.47, "learning_rate": 1.129379234972876e-05, "loss": 0.4654, "step": 4156 }, { "epoch": 0.48, "learning_rate": 1.1290121720166277e-05, "loss": 0.4713, "step": 4157 }, { "epoch": 0.48, "learning_rate": 1.1286450913828313e-05, "loss": 0.4479, "step": 4158 }, { "epoch": 0.48, "learning_rate": 1.1282779931217852e-05, "loss": 0.4562, "step": 4159 }, { "epoch": 0.48, "learning_rate": 1.1279108772837901e-05, "loss": 0.4596, "step": 4160 }, { "epoch": 0.48, "learning_rate": 1.1275437439191493e-05, "loss": 0.469, "step": 4161 }, { "epoch": 0.48, "learning_rate": 1.1271765930781677e-05, "loss": 0.4607, "step": 4162 }, { "epoch": 0.48, "learning_rate": 1.1268094248111536e-05, "loss": 0.471, "step": 4163 }, { "epoch": 0.48, "learning_rate": 1.1264422391684171e-05, "loss": 0.4497, "step": 4164 }, { "epoch": 0.48, "learning_rate": 1.126075036200271e-05, "loss": 0.4635, "step": 4165 }, { "epoch": 0.48, "learning_rate": 1.1257078159570303e-05, "loss": 0.4637, "step": 4166 }, { "epoch": 0.48, "learning_rate": 1.125340578489012e-05, "loss": 0.4544, "step": 4167 }, { "epoch": 0.48, "learning_rate": 1.1249733238465359e-05, "loss": 0.4707, "step": 4168 }, { "epoch": 0.48, "learning_rate": 1.1246060520799244e-05, "loss": 0.4489, "step": 4169 }, { "epoch": 0.48, "learning_rate": 1.1242387632395019e-05, "loss": 0.4794, "step": 4170 }, { "epoch": 0.48, "learning_rate": 1.1238714573755954e-05, "loss": 0.4467, "step": 4171 }, { "epoch": 0.48, "learning_rate": 1.1235041345385328e-05, "loss": 0.4618, "step": 4172 }, { "epoch": 0.48, "learning_rate": 1.123136794778647e-05, "loss": 0.4623, "step": 4173 }, { "epoch": 0.48, "learning_rate": 1.122769438146271e-05, "loss": 0.4752, "step": 4174 }, { "epoch": 0.48, "learning_rate": 1.1224020646917413e-05, "loss": 0.4514, "step": 4175 }, { "epoch": 0.48, "learning_rate": 1.1220346744653956e-05, "loss": 0.4628, "step": 4176 }, { "epoch": 0.48, "learning_rate": 1.1216672675175748e-05, "loss": 0.4627, "step": 4177 }, { "epoch": 0.48, "learning_rate": 1.1212998438986223e-05, "loss": 0.4575, "step": 4178 }, { "epoch": 0.48, "learning_rate": 1.1209324036588828e-05, "loss": 0.4789, "step": 4179 }, { "epoch": 0.48, "learning_rate": 1.1205649468487042e-05, "loss": 0.4914, "step": 4180 }, { "epoch": 0.48, "learning_rate": 1.1201974735184362e-05, "loss": 0.4602, "step": 4181 }, { "epoch": 0.48, "learning_rate": 1.1198299837184305e-05, "loss": 0.4697, "step": 4182 }, { "epoch": 0.48, "learning_rate": 1.1194624774990418e-05, "loss": 0.4737, "step": 4183 }, { "epoch": 0.48, "learning_rate": 1.119094954910627e-05, "loss": 0.4548, "step": 4184 }, { "epoch": 0.48, "learning_rate": 1.118727416003544e-05, "loss": 0.4352, "step": 4185 }, { "epoch": 0.48, "learning_rate": 1.1183598608281543e-05, "loss": 0.4824, "step": 4186 }, { "epoch": 0.48, "learning_rate": 1.1179922894348207e-05, "loss": 0.4557, "step": 4187 }, { "epoch": 0.48, "learning_rate": 1.11762470187391e-05, "loss": 0.4896, "step": 4188 }, { "epoch": 0.48, "learning_rate": 1.1172570981957886e-05, "loss": 0.4562, "step": 4189 }, { "epoch": 0.48, "learning_rate": 1.1168894784508268e-05, "loss": 0.4579, "step": 4190 }, { "epoch": 0.48, "learning_rate": 1.1165218426893969e-05, "loss": 0.4793, "step": 4191 }, { "epoch": 0.48, "learning_rate": 1.1161541909618728e-05, "loss": 0.4601, "step": 4192 }, { "epoch": 0.48, "learning_rate": 1.1157865233186315e-05, "loss": 0.4474, "step": 4193 }, { "epoch": 0.48, "learning_rate": 1.1154188398100516e-05, "loss": 0.4726, "step": 4194 }, { "epoch": 0.48, "learning_rate": 1.1150511404865136e-05, "loss": 0.4498, "step": 4195 }, { "epoch": 0.48, "learning_rate": 1.1146834253984008e-05, "loss": 0.473, "step": 4196 }, { "epoch": 0.48, "learning_rate": 1.114315694596098e-05, "loss": 0.4606, "step": 4197 }, { "epoch": 0.48, "learning_rate": 1.1139479481299928e-05, "loss": 0.4608, "step": 4198 }, { "epoch": 0.48, "learning_rate": 1.113580186050475e-05, "loss": 0.4625, "step": 4199 }, { "epoch": 0.48, "learning_rate": 1.1132124084079359e-05, "loss": 0.4688, "step": 4200 }, { "epoch": 0.48, "learning_rate": 1.112844615252769e-05, "loss": 0.4852, "step": 4201 }, { "epoch": 0.48, "learning_rate": 1.1124768066353705e-05, "loss": 0.4653, "step": 4202 }, { "epoch": 0.48, "learning_rate": 1.1121089826061385e-05, "loss": 0.4611, "step": 4203 }, { "epoch": 0.48, "learning_rate": 1.1117411432154725e-05, "loss": 0.47, "step": 4204 }, { "epoch": 0.48, "learning_rate": 1.1113732885137755e-05, "loss": 0.4632, "step": 4205 }, { "epoch": 0.48, "learning_rate": 1.1110054185514513e-05, "loss": 0.4561, "step": 4206 }, { "epoch": 0.48, "learning_rate": 1.1106375333789065e-05, "loss": 0.4782, "step": 4207 }, { "epoch": 0.48, "learning_rate": 1.1102696330465495e-05, "loss": 0.4728, "step": 4208 }, { "epoch": 0.48, "learning_rate": 1.1099017176047909e-05, "loss": 0.4594, "step": 4209 }, { "epoch": 0.48, "learning_rate": 1.109533787104043e-05, "loss": 0.4676, "step": 4210 }, { "epoch": 0.48, "learning_rate": 1.109165841594721e-05, "loss": 0.46, "step": 4211 }, { "epoch": 0.48, "learning_rate": 1.1087978811272417e-05, "loss": 0.4804, "step": 4212 }, { "epoch": 0.48, "learning_rate": 1.1084299057520234e-05, "loss": 0.4493, "step": 4213 }, { "epoch": 0.48, "learning_rate": 1.1080619155194873e-05, "loss": 0.4893, "step": 4214 }, { "epoch": 0.48, "learning_rate": 1.107693910480056e-05, "loss": 0.452, "step": 4215 }, { "epoch": 0.48, "learning_rate": 1.1073258906841547e-05, "loss": 0.4683, "step": 4216 }, { "epoch": 0.48, "learning_rate": 1.10695785618221e-05, "loss": 0.4677, "step": 4217 }, { "epoch": 0.48, "learning_rate": 1.1065898070246512e-05, "loss": 0.4687, "step": 4218 }, { "epoch": 0.48, "learning_rate": 1.1062217432619095e-05, "loss": 0.4808, "step": 4219 }, { "epoch": 0.48, "learning_rate": 1.1058536649444167e-05, "loss": 0.4601, "step": 4220 }, { "epoch": 0.48, "learning_rate": 1.105485572122609e-05, "loss": 0.4564, "step": 4221 }, { "epoch": 0.48, "learning_rate": 1.1051174648469225e-05, "loss": 0.4677, "step": 4222 }, { "epoch": 0.48, "learning_rate": 1.104749343167797e-05, "loss": 0.4712, "step": 4223 }, { "epoch": 0.48, "learning_rate": 1.104381207135672e-05, "loss": 0.475, "step": 4224 }, { "epoch": 0.48, "learning_rate": 1.104013056800992e-05, "loss": 0.4599, "step": 4225 }, { "epoch": 0.48, "learning_rate": 1.1036448922142004e-05, "loss": 0.4706, "step": 4226 }, { "epoch": 0.48, "learning_rate": 1.1032767134257451e-05, "loss": 0.4714, "step": 4227 }, { "epoch": 0.48, "learning_rate": 1.102908520486074e-05, "loss": 0.4596, "step": 4228 }, { "epoch": 0.48, "learning_rate": 1.1025403134456378e-05, "loss": 0.4529, "step": 4229 }, { "epoch": 0.48, "learning_rate": 1.1021720923548897e-05, "loss": 0.4729, "step": 4230 }, { "epoch": 0.48, "learning_rate": 1.1018038572642837e-05, "loss": 0.4506, "step": 4231 }, { "epoch": 0.48, "learning_rate": 1.1014356082242766e-05, "loss": 0.4713, "step": 4232 }, { "epoch": 0.48, "learning_rate": 1.1010673452853262e-05, "loss": 0.4613, "step": 4233 }, { "epoch": 0.48, "learning_rate": 1.1006990684978928e-05, "loss": 0.4614, "step": 4234 }, { "epoch": 0.48, "learning_rate": 1.1003307779124392e-05, "loss": 0.4434, "step": 4235 }, { "epoch": 0.48, "learning_rate": 1.0999624735794292e-05, "loss": 0.4647, "step": 4236 }, { "epoch": 0.48, "learning_rate": 1.0995941555493283e-05, "loss": 0.4507, "step": 4237 }, { "epoch": 0.48, "learning_rate": 1.0992258238726046e-05, "loss": 0.4711, "step": 4238 }, { "epoch": 0.48, "learning_rate": 1.0988574785997275e-05, "loss": 0.4512, "step": 4239 }, { "epoch": 0.48, "learning_rate": 1.0984891197811686e-05, "loss": 0.4598, "step": 4240 }, { "epoch": 0.48, "learning_rate": 1.0981207474674021e-05, "loss": 0.4618, "step": 4241 }, { "epoch": 0.48, "learning_rate": 1.0977523617089019e-05, "loss": 0.473, "step": 4242 }, { "epoch": 0.48, "learning_rate": 1.097383962556146e-05, "loss": 0.4364, "step": 4243 }, { "epoch": 0.49, "learning_rate": 1.0970155500596127e-05, "loss": 0.4559, "step": 4244 }, { "epoch": 0.49, "learning_rate": 1.0966471242697834e-05, "loss": 0.4674, "step": 4245 }, { "epoch": 0.49, "learning_rate": 1.0962786852371402e-05, "loss": 0.4773, "step": 4246 }, { "epoch": 0.49, "learning_rate": 1.0959102330121676e-05, "loss": 0.4772, "step": 4247 }, { "epoch": 0.49, "learning_rate": 1.0955417676453517e-05, "loss": 0.4668, "step": 4248 }, { "epoch": 0.49, "learning_rate": 1.0951732891871807e-05, "loss": 0.4536, "step": 4249 }, { "epoch": 0.49, "learning_rate": 1.0948047976881439e-05, "loss": 0.4819, "step": 4250 }, { "epoch": 0.49, "learning_rate": 1.0944362931987336e-05, "loss": 0.4545, "step": 4251 }, { "epoch": 0.49, "learning_rate": 1.0940677757694425e-05, "loss": 0.4557, "step": 4252 }, { "epoch": 0.49, "learning_rate": 1.093699245450766e-05, "loss": 0.4531, "step": 4253 }, { "epoch": 0.49, "learning_rate": 1.093330702293201e-05, "loss": 0.4528, "step": 4254 }, { "epoch": 0.49, "learning_rate": 1.092962146347246e-05, "loss": 0.4605, "step": 4255 }, { "epoch": 0.49, "learning_rate": 1.0925935776634014e-05, "loss": 0.4651, "step": 4256 }, { "epoch": 0.49, "learning_rate": 1.0922249962921694e-05, "loss": 0.4555, "step": 4257 }, { "epoch": 0.49, "learning_rate": 1.0918564022840539e-05, "loss": 0.4513, "step": 4258 }, { "epoch": 0.49, "learning_rate": 1.0914877956895604e-05, "loss": 0.4656, "step": 4259 }, { "epoch": 0.49, "learning_rate": 1.0911191765591966e-05, "loss": 0.4609, "step": 4260 }, { "epoch": 0.49, "learning_rate": 1.090750544943471e-05, "loss": 0.4698, "step": 4261 }, { "epoch": 0.49, "learning_rate": 1.0903819008928948e-05, "loss": 0.4613, "step": 4262 }, { "epoch": 0.49, "learning_rate": 1.0900132444579801e-05, "loss": 0.4463, "step": 4263 }, { "epoch": 0.49, "learning_rate": 1.0896445756892415e-05, "loss": 0.4858, "step": 4264 }, { "epoch": 0.49, "learning_rate": 1.0892758946371943e-05, "loss": 0.4598, "step": 4265 }, { "epoch": 0.49, "learning_rate": 1.0889072013523568e-05, "loss": 0.4422, "step": 4266 }, { "epoch": 0.49, "learning_rate": 1.0885384958852474e-05, "loss": 0.4569, "step": 4267 }, { "epoch": 0.49, "learning_rate": 1.0881697782863874e-05, "loss": 0.4665, "step": 4268 }, { "epoch": 0.49, "learning_rate": 1.0878010486062993e-05, "loss": 0.4516, "step": 4269 }, { "epoch": 0.49, "learning_rate": 1.0874323068955073e-05, "loss": 0.4574, "step": 4270 }, { "epoch": 0.49, "learning_rate": 1.0870635532045375e-05, "loss": 0.4604, "step": 4271 }, { "epoch": 0.49, "learning_rate": 1.0866947875839167e-05, "loss": 0.4557, "step": 4272 }, { "epoch": 0.49, "learning_rate": 1.0863260100841744e-05, "loss": 0.4617, "step": 4273 }, { "epoch": 0.49, "learning_rate": 1.0859572207558416e-05, "loss": 0.4668, "step": 4274 }, { "epoch": 0.49, "learning_rate": 1.0855884196494507e-05, "loss": 0.451, "step": 4275 }, { "epoch": 0.49, "learning_rate": 1.0852196068155352e-05, "loss": 0.4583, "step": 4276 }, { "epoch": 0.49, "learning_rate": 1.0848507823046306e-05, "loss": 0.4804, "step": 4277 }, { "epoch": 0.49, "learning_rate": 1.0844819461672748e-05, "loss": 0.4617, "step": 4278 }, { "epoch": 0.49, "learning_rate": 1.0841130984540063e-05, "loss": 0.4703, "step": 4279 }, { "epoch": 0.49, "learning_rate": 1.0837442392153651e-05, "loss": 0.4611, "step": 4280 }, { "epoch": 0.49, "learning_rate": 1.0833753685018935e-05, "loss": 0.451, "step": 4281 }, { "epoch": 0.49, "learning_rate": 1.0830064863641352e-05, "loss": 0.4829, "step": 4282 }, { "epoch": 0.49, "learning_rate": 1.082637592852635e-05, "loss": 0.459, "step": 4283 }, { "epoch": 0.49, "learning_rate": 1.0822686880179395e-05, "loss": 0.468, "step": 4284 }, { "epoch": 0.49, "learning_rate": 1.081899771910597e-05, "loss": 0.4545, "step": 4285 }, { "epoch": 0.49, "learning_rate": 1.081530844581157e-05, "loss": 0.4563, "step": 4286 }, { "epoch": 0.49, "learning_rate": 1.0811619060801713e-05, "loss": 0.4765, "step": 4287 }, { "epoch": 0.49, "learning_rate": 1.0807929564581925e-05, "loss": 0.4501, "step": 4288 }, { "epoch": 0.49, "learning_rate": 1.080423995765775e-05, "loss": 0.4503, "step": 4289 }, { "epoch": 0.49, "learning_rate": 1.0800550240534742e-05, "loss": 0.4785, "step": 4290 }, { "epoch": 0.49, "learning_rate": 1.0796860413718475e-05, "loss": 0.4585, "step": 4291 }, { "epoch": 0.49, "learning_rate": 1.0793170477714546e-05, "loss": 0.4625, "step": 4292 }, { "epoch": 0.49, "learning_rate": 1.0789480433028551e-05, "loss": 0.4596, "step": 4293 }, { "epoch": 0.49, "learning_rate": 1.0785790280166114e-05, "loss": 0.4536, "step": 4294 }, { "epoch": 0.49, "learning_rate": 1.078210001963286e-05, "loss": 0.4592, "step": 4295 }, { "epoch": 0.49, "learning_rate": 1.0778409651934442e-05, "loss": 0.4829, "step": 4296 }, { "epoch": 0.49, "learning_rate": 1.0774719177576526e-05, "loss": 0.4804, "step": 4297 }, { "epoch": 0.49, "learning_rate": 1.0771028597064785e-05, "loss": 0.4635, "step": 4298 }, { "epoch": 0.49, "learning_rate": 1.076733791090491e-05, "loss": 0.458, "step": 4299 }, { "epoch": 0.49, "learning_rate": 1.0763647119602614e-05, "loss": 0.4521, "step": 4300 }, { "epoch": 0.49, "learning_rate": 1.0759956223663608e-05, "loss": 0.4635, "step": 4301 }, { "epoch": 0.49, "learning_rate": 1.0756265223593637e-05, "loss": 0.4627, "step": 4302 }, { "epoch": 0.49, "learning_rate": 1.0752574119898445e-05, "loss": 0.4643, "step": 4303 }, { "epoch": 0.49, "learning_rate": 1.0748882913083794e-05, "loss": 0.4849, "step": 4304 }, { "epoch": 0.49, "learning_rate": 1.0745191603655466e-05, "loss": 0.4653, "step": 4305 }, { "epoch": 0.49, "learning_rate": 1.074150019211925e-05, "loss": 0.48, "step": 4306 }, { "epoch": 0.49, "learning_rate": 1.0737808678980954e-05, "loss": 0.4599, "step": 4307 }, { "epoch": 0.49, "learning_rate": 1.0734117064746395e-05, "loss": 0.4787, "step": 4308 }, { "epoch": 0.49, "learning_rate": 1.073042534992141e-05, "loss": 0.4467, "step": 4309 }, { "epoch": 0.49, "learning_rate": 1.0726733535011844e-05, "loss": 0.4669, "step": 4310 }, { "epoch": 0.49, "learning_rate": 1.0723041620523558e-05, "loss": 0.4679, "step": 4311 }, { "epoch": 0.49, "learning_rate": 1.0719349606962426e-05, "loss": 0.443, "step": 4312 }, { "epoch": 0.49, "learning_rate": 1.071565749483434e-05, "loss": 0.4815, "step": 4313 }, { "epoch": 0.49, "learning_rate": 1.0711965284645198e-05, "loss": 0.4714, "step": 4314 }, { "epoch": 0.49, "learning_rate": 1.0708272976900915e-05, "loss": 0.45, "step": 4315 }, { "epoch": 0.49, "learning_rate": 1.0704580572107424e-05, "loss": 0.4824, "step": 4316 }, { "epoch": 0.49, "learning_rate": 1.0700888070770663e-05, "loss": 0.4578, "step": 4317 }, { "epoch": 0.49, "learning_rate": 1.0697195473396587e-05, "loss": 0.4675, "step": 4318 }, { "epoch": 0.49, "learning_rate": 1.0693502780491168e-05, "loss": 0.4679, "step": 4319 }, { "epoch": 0.49, "learning_rate": 1.0689809992560382e-05, "loss": 0.4471, "step": 4320 }, { "epoch": 0.49, "learning_rate": 1.0686117110110228e-05, "loss": 0.4587, "step": 4321 }, { "epoch": 0.49, "learning_rate": 1.0682424133646712e-05, "loss": 0.4886, "step": 4322 }, { "epoch": 0.49, "learning_rate": 1.067873106367585e-05, "loss": 0.4718, "step": 4323 }, { "epoch": 0.49, "learning_rate": 1.0675037900703684e-05, "loss": 0.4528, "step": 4324 }, { "epoch": 0.49, "learning_rate": 1.0671344645236253e-05, "loss": 0.4683, "step": 4325 }, { "epoch": 0.49, "learning_rate": 1.0667651297779615e-05, "loss": 0.473, "step": 4326 }, { "epoch": 0.49, "learning_rate": 1.0663957858839843e-05, "loss": 0.4572, "step": 4327 }, { "epoch": 0.49, "learning_rate": 1.0660264328923024e-05, "loss": 0.4593, "step": 4328 }, { "epoch": 0.49, "learning_rate": 1.0656570708535248e-05, "loss": 0.4559, "step": 4329 }, { "epoch": 0.49, "learning_rate": 1.0652876998182626e-05, "loss": 0.4716, "step": 4330 }, { "epoch": 0.49, "learning_rate": 1.064918319837128e-05, "loss": 0.5014, "step": 4331 }, { "epoch": 0.5, "learning_rate": 1.0645489309607346e-05, "loss": 0.4458, "step": 4332 }, { "epoch": 0.5, "learning_rate": 1.064179533239696e-05, "loss": 0.4546, "step": 4333 }, { "epoch": 0.5, "learning_rate": 1.0638101267246283e-05, "loss": 0.5054, "step": 4334 }, { "epoch": 0.5, "learning_rate": 1.0634407114661492e-05, "loss": 0.4734, "step": 4335 }, { "epoch": 0.5, "learning_rate": 1.0630712875148758e-05, "loss": 0.4572, "step": 4336 }, { "epoch": 0.5, "learning_rate": 1.0627018549214284e-05, "loss": 0.4573, "step": 4337 }, { "epoch": 0.5, "learning_rate": 1.062332413736426e-05, "loss": 0.4595, "step": 4338 }, { "epoch": 0.5, "learning_rate": 1.0619629640104921e-05, "loss": 0.4774, "step": 4339 }, { "epoch": 0.5, "learning_rate": 1.0615935057942485e-05, "loss": 0.4731, "step": 4340 }, { "epoch": 0.5, "learning_rate": 1.0612240391383197e-05, "loss": 0.4404, "step": 4341 }, { "epoch": 0.5, "learning_rate": 1.0608545640933304e-05, "loss": 0.4807, "step": 4342 }, { "epoch": 0.5, "learning_rate": 1.060485080709907e-05, "loss": 0.4475, "step": 4343 }, { "epoch": 0.5, "learning_rate": 1.0601155890386771e-05, "loss": 0.468, "step": 4344 }, { "epoch": 0.5, "learning_rate": 1.05974608913027e-05, "loss": 0.4684, "step": 4345 }, { "epoch": 0.5, "learning_rate": 1.0593765810353142e-05, "loss": 0.4471, "step": 4346 }, { "epoch": 0.5, "learning_rate": 1.0590070648044415e-05, "loss": 0.465, "step": 4347 }, { "epoch": 0.5, "learning_rate": 1.0586375404882832e-05, "loss": 0.4646, "step": 4348 }, { "epoch": 0.5, "learning_rate": 1.0582680081374728e-05, "loss": 0.4695, "step": 4349 }, { "epoch": 0.5, "learning_rate": 1.0578984678026445e-05, "loss": 0.4684, "step": 4350 }, { "epoch": 0.5, "learning_rate": 1.0575289195344334e-05, "loss": 0.454, "step": 4351 }, { "epoch": 0.5, "learning_rate": 1.0571593633834758e-05, "loss": 0.477, "step": 4352 }, { "epoch": 0.5, "learning_rate": 1.0567897994004093e-05, "loss": 0.4632, "step": 4353 }, { "epoch": 0.5, "learning_rate": 1.0564202276358726e-05, "loss": 0.4516, "step": 4354 }, { "epoch": 0.5, "learning_rate": 1.0560506481405048e-05, "loss": 0.4679, "step": 4355 }, { "epoch": 0.5, "learning_rate": 1.0556810609649471e-05, "loss": 0.4686, "step": 4356 }, { "epoch": 0.5, "learning_rate": 1.0553114661598406e-05, "loss": 0.4695, "step": 4357 }, { "epoch": 0.5, "learning_rate": 1.0549418637758284e-05, "loss": 0.4569, "step": 4358 }, { "epoch": 0.5, "learning_rate": 1.0545722538635544e-05, "loss": 0.4721, "step": 4359 }, { "epoch": 0.5, "learning_rate": 1.054202636473663e-05, "loss": 0.4599, "step": 4360 }, { "epoch": 0.5, "learning_rate": 1.0538330116568006e-05, "loss": 0.4584, "step": 4361 }, { "epoch": 0.5, "learning_rate": 1.0534633794636134e-05, "loss": 0.469, "step": 4362 }, { "epoch": 0.5, "learning_rate": 1.0530937399447496e-05, "loss": 0.4706, "step": 4363 }, { "epoch": 0.5, "learning_rate": 1.0527240931508582e-05, "loss": 0.4607, "step": 4364 }, { "epoch": 0.5, "learning_rate": 1.0523544391325888e-05, "loss": 0.4766, "step": 4365 }, { "epoch": 0.5, "learning_rate": 1.0519847779405926e-05, "loss": 0.4552, "step": 4366 }, { "epoch": 0.5, "learning_rate": 1.051615109625521e-05, "loss": 0.4917, "step": 4367 }, { "epoch": 0.5, "learning_rate": 1.0512454342380269e-05, "loss": 0.4614, "step": 4368 }, { "epoch": 0.5, "learning_rate": 1.0508757518287642e-05, "loss": 0.453, "step": 4369 }, { "epoch": 0.5, "learning_rate": 1.0505060624483878e-05, "loss": 0.4705, "step": 4370 }, { "epoch": 0.5, "learning_rate": 1.0501363661475533e-05, "loss": 0.4748, "step": 4371 }, { "epoch": 0.5, "learning_rate": 1.0497666629769172e-05, "loss": 0.4521, "step": 4372 }, { "epoch": 0.5, "learning_rate": 1.049396952987137e-05, "loss": 0.463, "step": 4373 }, { "epoch": 0.5, "learning_rate": 1.0490272362288716e-05, "loss": 0.4574, "step": 4374 }, { "epoch": 0.5, "learning_rate": 1.0486575127527802e-05, "loss": 0.5077, "step": 4375 }, { "epoch": 0.5, "learning_rate": 1.0482877826095233e-05, "loss": 0.4699, "step": 4376 }, { "epoch": 0.5, "learning_rate": 1.047918045849762e-05, "loss": 0.4626, "step": 4377 }, { "epoch": 0.5, "learning_rate": 1.0475483025241587e-05, "loss": 0.4677, "step": 4378 }, { "epoch": 0.5, "learning_rate": 1.0471785526833762e-05, "loss": 0.4496, "step": 4379 }, { "epoch": 0.5, "learning_rate": 1.046808796378079e-05, "loss": 0.4818, "step": 4380 }, { "epoch": 0.5, "learning_rate": 1.0464390336589311e-05, "loss": 0.4648, "step": 4381 }, { "epoch": 0.5, "learning_rate": 1.046069264576599e-05, "loss": 0.4639, "step": 4382 }, { "epoch": 0.5, "learning_rate": 1.0456994891817492e-05, "loss": 0.501, "step": 4383 }, { "epoch": 0.5, "learning_rate": 1.045329707525049e-05, "loss": 0.4538, "step": 4384 }, { "epoch": 0.5, "learning_rate": 1.0449599196571671e-05, "loss": 0.4661, "step": 4385 }, { "epoch": 0.5, "learning_rate": 1.044590125628772e-05, "loss": 0.4508, "step": 4386 }, { "epoch": 0.5, "learning_rate": 1.0442203254905346e-05, "loss": 0.4545, "step": 4387 }, { "epoch": 0.5, "learning_rate": 1.043850519293125e-05, "loss": 0.4552, "step": 4388 }, { "epoch": 0.5, "learning_rate": 1.0434807070872154e-05, "loss": 0.4872, "step": 4389 }, { "epoch": 0.5, "learning_rate": 1.0431108889234783e-05, "loss": 0.4596, "step": 4390 }, { "epoch": 0.5, "learning_rate": 1.0427410648525863e-05, "loss": 0.4589, "step": 4391 }, { "epoch": 0.5, "learning_rate": 1.0423712349252148e-05, "loss": 0.4557, "step": 4392 }, { "epoch": 0.5, "learning_rate": 1.0420013991920382e-05, "loss": 0.4582, "step": 4393 }, { "epoch": 0.5, "learning_rate": 1.041631557703732e-05, "loss": 0.4466, "step": 4394 }, { "epoch": 0.5, "learning_rate": 1.0412617105109725e-05, "loss": 0.4584, "step": 4395 }, { "epoch": 0.5, "learning_rate": 1.0408918576644378e-05, "loss": 0.4645, "step": 4396 }, { "epoch": 0.5, "learning_rate": 1.0405219992148057e-05, "loss": 0.4663, "step": 4397 }, { "epoch": 0.5, "learning_rate": 1.040152135212755e-05, "loss": 0.4447, "step": 4398 }, { "epoch": 0.5, "learning_rate": 1.0397822657089653e-05, "loss": 0.4731, "step": 4399 }, { "epoch": 0.5, "learning_rate": 1.039412390754117e-05, "loss": 0.4579, "step": 4400 }, { "epoch": 0.5, "learning_rate": 1.039042510398891e-05, "loss": 0.4788, "step": 4401 }, { "epoch": 0.5, "learning_rate": 1.03867262469397e-05, "loss": 0.473, "step": 4402 }, { "epoch": 0.5, "learning_rate": 1.0383027336900356e-05, "loss": 0.4693, "step": 4403 }, { "epoch": 0.5, "learning_rate": 1.0379328374377715e-05, "loss": 0.4546, "step": 4404 }, { "epoch": 0.5, "learning_rate": 1.0375629359878616e-05, "loss": 0.4708, "step": 4405 }, { "epoch": 0.5, "learning_rate": 1.0371930293909911e-05, "loss": 0.4519, "step": 4406 }, { "epoch": 0.5, "learning_rate": 1.0368231176978454e-05, "loss": 0.4842, "step": 4407 }, { "epoch": 0.5, "learning_rate": 1.0364532009591101e-05, "loss": 0.4637, "step": 4408 }, { "epoch": 0.5, "learning_rate": 1.0360832792254727e-05, "loss": 0.4791, "step": 4409 }, { "epoch": 0.5, "learning_rate": 1.03571335254762e-05, "loss": 0.4545, "step": 4410 }, { "epoch": 0.5, "learning_rate": 1.0353434209762412e-05, "loss": 0.4852, "step": 4411 }, { "epoch": 0.5, "learning_rate": 1.0349734845620244e-05, "loss": 0.4396, "step": 4412 }, { "epoch": 0.5, "learning_rate": 1.0346035433556594e-05, "loss": 0.4579, "step": 4413 }, { "epoch": 0.5, "learning_rate": 1.0342335974078364e-05, "loss": 0.4664, "step": 4414 }, { "epoch": 0.5, "learning_rate": 1.0338636467692462e-05, "loss": 0.4647, "step": 4415 }, { "epoch": 0.5, "learning_rate": 1.0334936914905802e-05, "loss": 0.4764, "step": 4416 }, { "epoch": 0.5, "learning_rate": 1.0331237316225309e-05, "loss": 0.4702, "step": 4417 }, { "epoch": 0.5, "learning_rate": 1.0327537672157908e-05, "loss": 0.4681, "step": 4418 }, { "epoch": 0.51, "learning_rate": 1.0323837983210535e-05, "loss": 0.4651, "step": 4419 }, { "epoch": 0.51, "learning_rate": 1.0320138249890126e-05, "loss": 0.465, "step": 4420 }, { "epoch": 0.51, "learning_rate": 1.031643847270363e-05, "loss": 0.4518, "step": 4421 }, { "epoch": 0.51, "learning_rate": 1.0312738652157996e-05, "loss": 0.4564, "step": 4422 }, { "epoch": 0.51, "learning_rate": 1.0309038788760185e-05, "loss": 0.481, "step": 4423 }, { "epoch": 0.51, "learning_rate": 1.0305338883017163e-05, "loss": 0.4721, "step": 4424 }, { "epoch": 0.51, "learning_rate": 1.0301638935435896e-05, "loss": 0.469, "step": 4425 }, { "epoch": 0.51, "learning_rate": 1.0297938946523361e-05, "loss": 0.4487, "step": 4426 }, { "epoch": 0.51, "learning_rate": 1.0294238916786537e-05, "loss": 0.4555, "step": 4427 }, { "epoch": 0.51, "learning_rate": 1.0290538846732415e-05, "loss": 0.453, "step": 4428 }, { "epoch": 0.51, "learning_rate": 1.0286838736867981e-05, "loss": 0.4768, "step": 4429 }, { "epoch": 0.51, "learning_rate": 1.0283138587700236e-05, "loss": 0.4549, "step": 4430 }, { "epoch": 0.51, "learning_rate": 1.0279438399736185e-05, "loss": 0.4679, "step": 4431 }, { "epoch": 0.51, "learning_rate": 1.0275738173482835e-05, "loss": 0.4489, "step": 4432 }, { "epoch": 0.51, "learning_rate": 1.0272037909447197e-05, "loss": 0.4635, "step": 4433 }, { "epoch": 0.51, "learning_rate": 1.0268337608136292e-05, "loss": 0.4474, "step": 4434 }, { "epoch": 0.51, "learning_rate": 1.0264637270057146e-05, "loss": 0.4724, "step": 4435 }, { "epoch": 0.51, "learning_rate": 1.0260936895716781e-05, "loss": 0.458, "step": 4436 }, { "epoch": 0.51, "learning_rate": 1.0257236485622241e-05, "loss": 0.4632, "step": 4437 }, { "epoch": 0.51, "learning_rate": 1.0253536040280556e-05, "loss": 0.4592, "step": 4438 }, { "epoch": 0.51, "learning_rate": 1.0249835560198772e-05, "loss": 0.4643, "step": 4439 }, { "epoch": 0.51, "learning_rate": 1.0246135045883943e-05, "loss": 0.4771, "step": 4440 }, { "epoch": 0.51, "learning_rate": 1.0242434497843117e-05, "loss": 0.4872, "step": 4441 }, { "epoch": 0.51, "learning_rate": 1.023873391658335e-05, "loss": 0.4517, "step": 4442 }, { "epoch": 0.51, "learning_rate": 1.0235033302611704e-05, "loss": 0.4768, "step": 4443 }, { "epoch": 0.51, "learning_rate": 1.023133265643525e-05, "loss": 0.4565, "step": 4444 }, { "epoch": 0.51, "learning_rate": 1.0227631978561057e-05, "loss": 0.4665, "step": 4445 }, { "epoch": 0.51, "learning_rate": 1.0223931269496204e-05, "loss": 0.4572, "step": 4446 }, { "epoch": 0.51, "learning_rate": 1.0220230529747766e-05, "loss": 0.4538, "step": 4447 }, { "epoch": 0.51, "learning_rate": 1.0216529759822823e-05, "loss": 0.4572, "step": 4448 }, { "epoch": 0.51, "learning_rate": 1.0212828960228475e-05, "loss": 0.4631, "step": 4449 }, { "epoch": 0.51, "learning_rate": 1.0209128131471809e-05, "loss": 0.454, "step": 4450 }, { "epoch": 0.51, "learning_rate": 1.0205427274059915e-05, "loss": 0.4702, "step": 4451 }, { "epoch": 0.51, "learning_rate": 1.02017263884999e-05, "loss": 0.4545, "step": 4452 }, { "epoch": 0.51, "learning_rate": 1.0198025475298865e-05, "loss": 0.4729, "step": 4453 }, { "epoch": 0.51, "learning_rate": 1.019432453496392e-05, "loss": 0.4482, "step": 4454 }, { "epoch": 0.51, "learning_rate": 1.0190623568002178e-05, "loss": 0.446, "step": 4455 }, { "epoch": 0.51, "learning_rate": 1.0186922574920747e-05, "loss": 0.4636, "step": 4456 }, { "epoch": 0.51, "learning_rate": 1.018322155622675e-05, "loss": 0.4636, "step": 4457 }, { "epoch": 0.51, "learning_rate": 1.017952051242731e-05, "loss": 0.469, "step": 4458 }, { "epoch": 0.51, "learning_rate": 1.0175819444029555e-05, "loss": 0.4491, "step": 4459 }, { "epoch": 0.51, "learning_rate": 1.0172118351540608e-05, "loss": 0.4544, "step": 4460 }, { "epoch": 0.51, "learning_rate": 1.0168417235467604e-05, "loss": 0.4653, "step": 4461 }, { "epoch": 0.51, "learning_rate": 1.0164716096317677e-05, "loss": 0.4614, "step": 4462 }, { "epoch": 0.51, "learning_rate": 1.016101493459797e-05, "loss": 0.4497, "step": 4463 }, { "epoch": 0.51, "learning_rate": 1.0157313750815623e-05, "loss": 0.4507, "step": 4464 }, { "epoch": 0.51, "learning_rate": 1.0153612545477778e-05, "loss": 0.4477, "step": 4465 }, { "epoch": 0.51, "learning_rate": 1.0149911319091583e-05, "loss": 0.4675, "step": 4466 }, { "epoch": 0.51, "learning_rate": 1.014621007216419e-05, "loss": 0.4669, "step": 4467 }, { "epoch": 0.51, "learning_rate": 1.0142508805202757e-05, "loss": 0.4668, "step": 4468 }, { "epoch": 0.51, "learning_rate": 1.0138807518714435e-05, "loss": 0.4754, "step": 4469 }, { "epoch": 0.51, "learning_rate": 1.0135106213206382e-05, "loss": 0.4581, "step": 4470 }, { "epoch": 0.51, "learning_rate": 1.0131404889185762e-05, "loss": 0.4621, "step": 4471 }, { "epoch": 0.51, "learning_rate": 1.012770354715974e-05, "loss": 0.459, "step": 4472 }, { "epoch": 0.51, "learning_rate": 1.012400218763548e-05, "loss": 0.4633, "step": 4473 }, { "epoch": 0.51, "learning_rate": 1.012030081112015e-05, "loss": 0.4751, "step": 4474 }, { "epoch": 0.51, "learning_rate": 1.0116599418120924e-05, "loss": 0.4624, "step": 4475 }, { "epoch": 0.51, "learning_rate": 1.0112898009144977e-05, "loss": 0.4584, "step": 4476 }, { "epoch": 0.51, "learning_rate": 1.0109196584699478e-05, "loss": 0.4615, "step": 4477 }, { "epoch": 0.51, "learning_rate": 1.0105495145291612e-05, "loss": 0.4712, "step": 4478 }, { "epoch": 0.51, "learning_rate": 1.0101793691428554e-05, "loss": 0.456, "step": 4479 }, { "epoch": 0.51, "learning_rate": 1.0098092223617488e-05, "loss": 0.4551, "step": 4480 }, { "epoch": 0.51, "learning_rate": 1.0094390742365598e-05, "loss": 0.4553, "step": 4481 }, { "epoch": 0.51, "learning_rate": 1.009068924818007e-05, "loss": 0.47, "step": 4482 }, { "epoch": 0.51, "learning_rate": 1.0086987741568089e-05, "loss": 0.4609, "step": 4483 }, { "epoch": 0.51, "learning_rate": 1.0083286223036845e-05, "loss": 0.4694, "step": 4484 }, { "epoch": 0.51, "learning_rate": 1.0079584693093529e-05, "loss": 0.4731, "step": 4485 }, { "epoch": 0.51, "learning_rate": 1.0075883152245334e-05, "loss": 0.4774, "step": 4486 }, { "epoch": 0.51, "learning_rate": 1.007218160099945e-05, "loss": 0.4797, "step": 4487 }, { "epoch": 0.51, "learning_rate": 1.006848003986308e-05, "loss": 0.4382, "step": 4488 }, { "epoch": 0.51, "learning_rate": 1.0064778469343413e-05, "loss": 0.4554, "step": 4489 }, { "epoch": 0.51, "learning_rate": 1.006107688994765e-05, "loss": 0.4602, "step": 4490 }, { "epoch": 0.51, "learning_rate": 1.0057375302182988e-05, "loss": 0.4634, "step": 4491 }, { "epoch": 0.51, "learning_rate": 1.005367370655663e-05, "loss": 0.4633, "step": 4492 }, { "epoch": 0.51, "learning_rate": 1.0049972103575775e-05, "loss": 0.4775, "step": 4493 }, { "epoch": 0.51, "learning_rate": 1.004627049374763e-05, "loss": 0.462, "step": 4494 }, { "epoch": 0.51, "learning_rate": 1.0042568877579388e-05, "loss": 0.4605, "step": 4495 }, { "epoch": 0.51, "learning_rate": 1.0038867255578261e-05, "loss": 0.45, "step": 4496 }, { "epoch": 0.51, "learning_rate": 1.0035165628251455e-05, "loss": 0.4773, "step": 4497 }, { "epoch": 0.51, "learning_rate": 1.0031463996106175e-05, "loss": 0.462, "step": 4498 }, { "epoch": 0.51, "learning_rate": 1.002776235964962e-05, "loss": 0.4733, "step": 4499 }, { "epoch": 0.51, "learning_rate": 1.0024060719389002e-05, "loss": 0.4687, "step": 4500 }, { "epoch": 0.51, "learning_rate": 1.002035907583153e-05, "loss": 0.4611, "step": 4501 }, { "epoch": 0.51, "learning_rate": 1.001665742948441e-05, "loss": 0.4397, "step": 4502 }, { "epoch": 0.51, "learning_rate": 1.0012955780854852e-05, "loss": 0.4622, "step": 4503 }, { "epoch": 0.51, "learning_rate": 1.0009254130450059e-05, "loss": 0.4544, "step": 4504 }, { "epoch": 0.51, "learning_rate": 1.0005552478777244e-05, "loss": 0.4854, "step": 4505 }, { "epoch": 0.51, "learning_rate": 1.0001850826343615e-05, "loss": 0.458, "step": 4506 }, { "epoch": 0.52, "learning_rate": 9.998149173656387e-06, "loss": 0.4704, "step": 4507 }, { "epoch": 0.52, "learning_rate": 9.994447521222758e-06, "loss": 0.4649, "step": 4508 }, { "epoch": 0.52, "learning_rate": 9.990745869549943e-06, "loss": 0.4603, "step": 4509 }, { "epoch": 0.52, "learning_rate": 9.987044219145155e-06, "loss": 0.4715, "step": 4510 }, { "epoch": 0.52, "learning_rate": 9.983342570515592e-06, "loss": 0.4502, "step": 4511 }, { "epoch": 0.52, "learning_rate": 9.979640924168475e-06, "loss": 0.4481, "step": 4512 }, { "epoch": 0.52, "learning_rate": 9.975939280611e-06, "loss": 0.4688, "step": 4513 }, { "epoch": 0.52, "learning_rate": 9.972237640350383e-06, "loss": 0.4572, "step": 4514 }, { "epoch": 0.52, "learning_rate": 9.968536003893832e-06, "loss": 0.4765, "step": 4515 }, { "epoch": 0.52, "learning_rate": 9.964834371748547e-06, "loss": 0.4421, "step": 4516 }, { "epoch": 0.52, "learning_rate": 9.96113274442174e-06, "loss": 0.4692, "step": 4517 }, { "epoch": 0.52, "learning_rate": 9.957431122420615e-06, "loss": 0.4652, "step": 4518 }, { "epoch": 0.52, "learning_rate": 9.953729506252374e-06, "loss": 0.4713, "step": 4519 }, { "epoch": 0.52, "learning_rate": 9.950027896424228e-06, "loss": 0.4544, "step": 4520 }, { "epoch": 0.52, "learning_rate": 9.946326293443371e-06, "loss": 0.4721, "step": 4521 }, { "epoch": 0.52, "learning_rate": 9.942624697817015e-06, "loss": 0.4527, "step": 4522 }, { "epoch": 0.52, "learning_rate": 9.938923110052353e-06, "loss": 0.4667, "step": 4523 }, { "epoch": 0.52, "learning_rate": 9.935221530656589e-06, "loss": 0.4684, "step": 4524 }, { "epoch": 0.52, "learning_rate": 9.931519960136925e-06, "loss": 0.469, "step": 4525 }, { "epoch": 0.52, "learning_rate": 9.92781839900055e-06, "loss": 0.4682, "step": 4526 }, { "epoch": 0.52, "learning_rate": 9.92411684775467e-06, "loss": 0.4617, "step": 4527 }, { "epoch": 0.52, "learning_rate": 9.920415306906475e-06, "loss": 0.4692, "step": 4528 }, { "epoch": 0.52, "learning_rate": 9.916713776963156e-06, "loss": 0.4503, "step": 4529 }, { "epoch": 0.52, "learning_rate": 9.913012258431915e-06, "loss": 0.453, "step": 4530 }, { "epoch": 0.52, "learning_rate": 9.909310751819936e-06, "loss": 0.4832, "step": 4531 }, { "epoch": 0.52, "learning_rate": 9.905609257634404e-06, "loss": 0.4704, "step": 4532 }, { "epoch": 0.52, "learning_rate": 9.901907776382514e-06, "loss": 0.4666, "step": 4533 }, { "epoch": 0.52, "learning_rate": 9.898206308571446e-06, "loss": 0.4546, "step": 4534 }, { "epoch": 0.52, "learning_rate": 9.894504854708391e-06, "loss": 0.4571, "step": 4535 }, { "epoch": 0.52, "learning_rate": 9.890803415300527e-06, "loss": 0.475, "step": 4536 }, { "epoch": 0.52, "learning_rate": 9.887101990855027e-06, "loss": 0.4718, "step": 4537 }, { "epoch": 0.52, "learning_rate": 9.883400581879077e-06, "loss": 0.4536, "step": 4538 }, { "epoch": 0.52, "learning_rate": 9.87969918887985e-06, "loss": 0.4675, "step": 4539 }, { "epoch": 0.52, "learning_rate": 9.875997812364524e-06, "loss": 0.451, "step": 4540 }, { "epoch": 0.52, "learning_rate": 9.872296452840266e-06, "loss": 0.4575, "step": 4541 }, { "epoch": 0.52, "learning_rate": 9.86859511081424e-06, "loss": 0.4571, "step": 4542 }, { "epoch": 0.52, "learning_rate": 9.86489378679362e-06, "loss": 0.4678, "step": 4543 }, { "epoch": 0.52, "learning_rate": 9.86119248128557e-06, "loss": 0.4673, "step": 4544 }, { "epoch": 0.52, "learning_rate": 9.857491194797244e-06, "loss": 0.4733, "step": 4545 }, { "epoch": 0.52, "learning_rate": 9.853789927835811e-06, "loss": 0.4682, "step": 4546 }, { "epoch": 0.52, "learning_rate": 9.85008868090842e-06, "loss": 0.4519, "step": 4547 }, { "epoch": 0.52, "learning_rate": 9.846387454522225e-06, "loss": 0.4542, "step": 4548 }, { "epoch": 0.52, "learning_rate": 9.842686249184384e-06, "loss": 0.4461, "step": 4549 }, { "epoch": 0.52, "learning_rate": 9.838985065402032e-06, "loss": 0.4728, "step": 4550 }, { "epoch": 0.52, "learning_rate": 9.835283903682327e-06, "loss": 0.4747, "step": 4551 }, { "epoch": 0.52, "learning_rate": 9.831582764532399e-06, "loss": 0.4419, "step": 4552 }, { "epoch": 0.52, "learning_rate": 9.827881648459396e-06, "loss": 0.4559, "step": 4553 }, { "epoch": 0.52, "learning_rate": 9.824180555970451e-06, "loss": 0.4902, "step": 4554 }, { "epoch": 0.52, "learning_rate": 9.820479487572691e-06, "loss": 0.443, "step": 4555 }, { "epoch": 0.52, "learning_rate": 9.816778443773253e-06, "loss": 0.4473, "step": 4556 }, { "epoch": 0.52, "learning_rate": 9.813077425079258e-06, "loss": 0.4676, "step": 4557 }, { "epoch": 0.52, "learning_rate": 9.809376431997825e-06, "loss": 0.446, "step": 4558 }, { "epoch": 0.52, "learning_rate": 9.805675465036084e-06, "loss": 0.4786, "step": 4559 }, { "epoch": 0.52, "learning_rate": 9.801974524701135e-06, "loss": 0.4651, "step": 4560 }, { "epoch": 0.52, "learning_rate": 9.798273611500103e-06, "loss": 0.4478, "step": 4561 }, { "epoch": 0.52, "learning_rate": 9.794572725940088e-06, "loss": 0.4633, "step": 4562 }, { "epoch": 0.52, "learning_rate": 9.790871868528194e-06, "loss": 0.4631, "step": 4563 }, { "epoch": 0.52, "learning_rate": 9.787171039771528e-06, "loss": 0.458, "step": 4564 }, { "epoch": 0.52, "learning_rate": 9.783470240177175e-06, "loss": 0.4644, "step": 4565 }, { "epoch": 0.52, "learning_rate": 9.779769470252237e-06, "loss": 0.4525, "step": 4566 }, { "epoch": 0.52, "learning_rate": 9.776068730503801e-06, "loss": 0.48, "step": 4567 }, { "epoch": 0.52, "learning_rate": 9.772368021438943e-06, "loss": 0.4676, "step": 4568 }, { "epoch": 0.52, "learning_rate": 9.768667343564752e-06, "loss": 0.4516, "step": 4569 }, { "epoch": 0.52, "learning_rate": 9.7649666973883e-06, "loss": 0.4608, "step": 4570 }, { "epoch": 0.52, "learning_rate": 9.761266083416655e-06, "loss": 0.4624, "step": 4571 }, { "epoch": 0.52, "learning_rate": 9.75756550215689e-06, "loss": 0.4609, "step": 4572 }, { "epoch": 0.52, "learning_rate": 9.753864954116058e-06, "loss": 0.4632, "step": 4573 }, { "epoch": 0.52, "learning_rate": 9.75016443980123e-06, "loss": 0.4696, "step": 4574 }, { "epoch": 0.52, "learning_rate": 9.746463959719447e-06, "loss": 0.4639, "step": 4575 }, { "epoch": 0.52, "learning_rate": 9.74276351437776e-06, "loss": 0.4705, "step": 4576 }, { "epoch": 0.52, "learning_rate": 9.73906310428322e-06, "loss": 0.4716, "step": 4577 }, { "epoch": 0.52, "learning_rate": 9.735362729942856e-06, "loss": 0.4548, "step": 4578 }, { "epoch": 0.52, "learning_rate": 9.731662391863711e-06, "loss": 0.453, "step": 4579 }, { "epoch": 0.52, "learning_rate": 9.727962090552808e-06, "loss": 0.4619, "step": 4580 }, { "epoch": 0.52, "learning_rate": 9.724261826517167e-06, "loss": 0.4502, "step": 4581 }, { "epoch": 0.52, "learning_rate": 9.720561600263818e-06, "loss": 0.4543, "step": 4582 }, { "epoch": 0.52, "learning_rate": 9.716861412299769e-06, "loss": 0.4512, "step": 4583 }, { "epoch": 0.52, "learning_rate": 9.713161263132022e-06, "loss": 0.4865, "step": 4584 }, { "epoch": 0.52, "learning_rate": 9.70946115326759e-06, "loss": 0.4704, "step": 4585 }, { "epoch": 0.52, "learning_rate": 9.705761083213463e-06, "loss": 0.4619, "step": 4586 }, { "epoch": 0.52, "learning_rate": 9.702061053476642e-06, "loss": 0.4452, "step": 4587 }, { "epoch": 0.52, "learning_rate": 9.698361064564107e-06, "loss": 0.4892, "step": 4588 }, { "epoch": 0.52, "learning_rate": 9.694661116982838e-06, "loss": 0.437, "step": 4589 }, { "epoch": 0.52, "learning_rate": 9.690961211239816e-06, "loss": 0.4578, "step": 4590 }, { "epoch": 0.52, "learning_rate": 9.687261347842004e-06, "loss": 0.4736, "step": 4591 }, { "epoch": 0.52, "learning_rate": 9.683561527296375e-06, "loss": 0.4749, "step": 4592 }, { "epoch": 0.52, "learning_rate": 9.67986175010988e-06, "loss": 0.4598, "step": 4593 }, { "epoch": 0.53, "learning_rate": 9.676162016789469e-06, "loss": 0.4787, "step": 4594 }, { "epoch": 0.53, "learning_rate": 9.672462327842095e-06, "loss": 0.4639, "step": 4595 }, { "epoch": 0.53, "learning_rate": 9.668762683774691e-06, "loss": 0.4549, "step": 4596 }, { "epoch": 0.53, "learning_rate": 9.6650630850942e-06, "loss": 0.4702, "step": 4597 }, { "epoch": 0.53, "learning_rate": 9.661363532307543e-06, "loss": 0.4616, "step": 4598 }, { "epoch": 0.53, "learning_rate": 9.65766402592164e-06, "loss": 0.4599, "step": 4599 }, { "epoch": 0.53, "learning_rate": 9.65396456644341e-06, "loss": 0.4743, "step": 4600 }, { "epoch": 0.53, "learning_rate": 9.650265154379761e-06, "loss": 0.4605, "step": 4601 }, { "epoch": 0.53, "learning_rate": 9.64656579023759e-06, "loss": 0.4574, "step": 4602 }, { "epoch": 0.53, "learning_rate": 9.642866474523802e-06, "loss": 0.458, "step": 4603 }, { "epoch": 0.53, "learning_rate": 9.639167207745276e-06, "loss": 0.448, "step": 4604 }, { "epoch": 0.53, "learning_rate": 9.6354679904089e-06, "loss": 0.4661, "step": 4605 }, { "epoch": 0.53, "learning_rate": 9.631768823021551e-06, "loss": 0.4667, "step": 4606 }, { "epoch": 0.53, "learning_rate": 9.628069706090089e-06, "loss": 0.4673, "step": 4607 }, { "epoch": 0.53, "learning_rate": 9.624370640121387e-06, "loss": 0.4743, "step": 4608 }, { "epoch": 0.53, "learning_rate": 9.620671625622287e-06, "loss": 0.4708, "step": 4609 }, { "epoch": 0.53, "learning_rate": 9.616972663099648e-06, "loss": 0.4519, "step": 4610 }, { "epoch": 0.53, "learning_rate": 9.613273753060306e-06, "loss": 0.4693, "step": 4611 }, { "epoch": 0.53, "learning_rate": 9.60957489601109e-06, "loss": 0.4497, "step": 4612 }, { "epoch": 0.53, "learning_rate": 9.605876092458835e-06, "loss": 0.4547, "step": 4613 }, { "epoch": 0.53, "learning_rate": 9.60217734291035e-06, "loss": 0.4704, "step": 4614 }, { "epoch": 0.53, "learning_rate": 9.598478647872451e-06, "loss": 0.4674, "step": 4615 }, { "epoch": 0.53, "learning_rate": 9.594780007851947e-06, "loss": 0.4687, "step": 4616 }, { "epoch": 0.53, "learning_rate": 9.591081423355622e-06, "loss": 0.4746, "step": 4617 }, { "epoch": 0.53, "learning_rate": 9.587382894890276e-06, "loss": 0.4641, "step": 4618 }, { "epoch": 0.53, "learning_rate": 9.583684422962686e-06, "loss": 0.4568, "step": 4619 }, { "epoch": 0.53, "learning_rate": 9.57998600807962e-06, "loss": 0.4585, "step": 4620 }, { "epoch": 0.53, "learning_rate": 9.576287650747854e-06, "loss": 0.455, "step": 4621 }, { "epoch": 0.53, "learning_rate": 9.572589351474135e-06, "loss": 0.4596, "step": 4622 }, { "epoch": 0.53, "learning_rate": 9.568891110765219e-06, "loss": 0.4498, "step": 4623 }, { "epoch": 0.53, "learning_rate": 9.565192929127849e-06, "loss": 0.4718, "step": 4624 }, { "epoch": 0.53, "learning_rate": 9.56149480706875e-06, "loss": 0.459, "step": 4625 }, { "epoch": 0.53, "learning_rate": 9.557796745094659e-06, "loss": 0.4699, "step": 4626 }, { "epoch": 0.53, "learning_rate": 9.554098743712282e-06, "loss": 0.4617, "step": 4627 }, { "epoch": 0.53, "learning_rate": 9.55040080342833e-06, "loss": 0.4584, "step": 4628 }, { "epoch": 0.53, "learning_rate": 9.546702924749513e-06, "loss": 0.4683, "step": 4629 }, { "epoch": 0.53, "learning_rate": 9.543005108182508e-06, "loss": 0.4565, "step": 4630 }, { "epoch": 0.53, "learning_rate": 9.539307354234013e-06, "loss": 0.4596, "step": 4631 }, { "epoch": 0.53, "learning_rate": 9.535609663410692e-06, "loss": 0.4669, "step": 4632 }, { "epoch": 0.53, "learning_rate": 9.531912036219214e-06, "loss": 0.4542, "step": 4633 }, { "epoch": 0.53, "learning_rate": 9.528214473166241e-06, "loss": 0.4628, "step": 4634 }, { "epoch": 0.53, "learning_rate": 9.524516974758415e-06, "loss": 0.4588, "step": 4635 }, { "epoch": 0.53, "learning_rate": 9.520819541502384e-06, "loss": 0.4724, "step": 4636 }, { "epoch": 0.53, "learning_rate": 9.51712217390477e-06, "loss": 0.4556, "step": 4637 }, { "epoch": 0.53, "learning_rate": 9.5134248724722e-06, "loss": 0.4625, "step": 4638 }, { "epoch": 0.53, "learning_rate": 9.509727637711287e-06, "loss": 0.4548, "step": 4639 }, { "epoch": 0.53, "learning_rate": 9.506030470128635e-06, "loss": 0.4666, "step": 4640 }, { "epoch": 0.53, "learning_rate": 9.502333370230831e-06, "loss": 0.4542, "step": 4641 }, { "epoch": 0.53, "learning_rate": 9.49863633852447e-06, "loss": 0.4654, "step": 4642 }, { "epoch": 0.53, "learning_rate": 9.494939375516122e-06, "loss": 0.4402, "step": 4643 }, { "epoch": 0.53, "learning_rate": 9.49124248171236e-06, "loss": 0.459, "step": 4644 }, { "epoch": 0.53, "learning_rate": 9.487545657619736e-06, "loss": 0.4613, "step": 4645 }, { "epoch": 0.53, "learning_rate": 9.483848903744795e-06, "loss": 0.4691, "step": 4646 }, { "epoch": 0.53, "learning_rate": 9.48015222059408e-06, "loss": 0.451, "step": 4647 }, { "epoch": 0.53, "learning_rate": 9.476455608674112e-06, "loss": 0.4657, "step": 4648 }, { "epoch": 0.53, "learning_rate": 9.472759068491421e-06, "loss": 0.4631, "step": 4649 }, { "epoch": 0.53, "learning_rate": 9.469062600552509e-06, "loss": 0.4553, "step": 4650 }, { "epoch": 0.53, "learning_rate": 9.46536620536387e-06, "loss": 0.4589, "step": 4651 }, { "epoch": 0.53, "learning_rate": 9.461669883431997e-06, "loss": 0.4644, "step": 4652 }, { "epoch": 0.53, "learning_rate": 9.457973635263375e-06, "loss": 0.4886, "step": 4653 }, { "epoch": 0.53, "learning_rate": 9.45427746136446e-06, "loss": 0.4691, "step": 4654 }, { "epoch": 0.53, "learning_rate": 9.45058136224172e-06, "loss": 0.4444, "step": 4655 }, { "epoch": 0.53, "learning_rate": 9.446885338401597e-06, "loss": 0.4715, "step": 4656 }, { "epoch": 0.53, "learning_rate": 9.443189390350534e-06, "loss": 0.4667, "step": 4657 }, { "epoch": 0.53, "learning_rate": 9.439493518594957e-06, "loss": 0.4679, "step": 4658 }, { "epoch": 0.53, "learning_rate": 9.435797723641277e-06, "loss": 0.4479, "step": 4659 }, { "epoch": 0.53, "learning_rate": 9.432102005995912e-06, "loss": 0.4777, "step": 4660 }, { "epoch": 0.53, "learning_rate": 9.428406366165244e-06, "loss": 0.4656, "step": 4661 }, { "epoch": 0.53, "learning_rate": 9.424710804655669e-06, "loss": 0.4465, "step": 4662 }, { "epoch": 0.53, "learning_rate": 9.42101532197356e-06, "loss": 0.4584, "step": 4663 }, { "epoch": 0.53, "learning_rate": 9.417319918625274e-06, "loss": 0.4644, "step": 4664 }, { "epoch": 0.53, "learning_rate": 9.413624595117173e-06, "loss": 0.4449, "step": 4665 }, { "epoch": 0.53, "learning_rate": 9.409929351955592e-06, "loss": 0.4884, "step": 4666 }, { "epoch": 0.53, "learning_rate": 9.40623418964686e-06, "loss": 0.4483, "step": 4667 }, { "epoch": 0.53, "learning_rate": 9.402539108697306e-06, "loss": 0.4915, "step": 4668 }, { "epoch": 0.53, "learning_rate": 9.398844109613228e-06, "loss": 0.4573, "step": 4669 }, { "epoch": 0.53, "learning_rate": 9.395149192900934e-06, "loss": 0.4712, "step": 4670 }, { "epoch": 0.53, "learning_rate": 9.391454359066701e-06, "loss": 0.4664, "step": 4671 }, { "epoch": 0.53, "learning_rate": 9.387759608616806e-06, "loss": 0.4573, "step": 4672 }, { "epoch": 0.53, "learning_rate": 9.384064942057518e-06, "loss": 0.4352, "step": 4673 }, { "epoch": 0.53, "learning_rate": 9.380370359895079e-06, "loss": 0.4715, "step": 4674 }, { "epoch": 0.53, "learning_rate": 9.37667586263574e-06, "loss": 0.4777, "step": 4675 }, { "epoch": 0.53, "learning_rate": 9.372981450785723e-06, "loss": 0.4662, "step": 4676 }, { "epoch": 0.53, "learning_rate": 9.369287124851243e-06, "loss": 0.4557, "step": 4677 }, { "epoch": 0.53, "learning_rate": 9.365592885338512e-06, "loss": 0.457, "step": 4678 }, { "epoch": 0.53, "learning_rate": 9.361898732753715e-06, "loss": 0.4632, "step": 4679 }, { "epoch": 0.53, "learning_rate": 9.358204667603043e-06, "loss": 0.4692, "step": 4680 }, { "epoch": 0.53, "learning_rate": 9.35451069039266e-06, "loss": 0.4565, "step": 4681 }, { "epoch": 0.54, "learning_rate": 9.35081680162872e-06, "loss": 0.4649, "step": 4682 }, { "epoch": 0.54, "learning_rate": 9.347123001817376e-06, "loss": 0.4416, "step": 4683 }, { "epoch": 0.54, "learning_rate": 9.343429291464756e-06, "loss": 0.485, "step": 4684 }, { "epoch": 0.54, "learning_rate": 9.339735671076978e-06, "loss": 0.4466, "step": 4685 }, { "epoch": 0.54, "learning_rate": 9.336042141160158e-06, "loss": 0.4855, "step": 4686 }, { "epoch": 0.54, "learning_rate": 9.332348702220386e-06, "loss": 0.4635, "step": 4687 }, { "epoch": 0.54, "learning_rate": 9.32865535476375e-06, "loss": 0.4589, "step": 4688 }, { "epoch": 0.54, "learning_rate": 9.32496209929632e-06, "loss": 0.4634, "step": 4689 }, { "epoch": 0.54, "learning_rate": 9.32126893632415e-06, "loss": 0.4645, "step": 4690 }, { "epoch": 0.54, "learning_rate": 9.317575866353293e-06, "loss": 0.442, "step": 4691 }, { "epoch": 0.54, "learning_rate": 9.313882889889773e-06, "loss": 0.4607, "step": 4692 }, { "epoch": 0.54, "learning_rate": 9.31019000743962e-06, "loss": 0.4629, "step": 4693 }, { "epoch": 0.54, "learning_rate": 9.306497219508835e-06, "loss": 0.4754, "step": 4694 }, { "epoch": 0.54, "learning_rate": 9.302804526603413e-06, "loss": 0.4514, "step": 4695 }, { "epoch": 0.54, "learning_rate": 9.29911192922934e-06, "loss": 0.4604, "step": 4696 }, { "epoch": 0.54, "learning_rate": 9.29541942789258e-06, "loss": 0.4665, "step": 4697 }, { "epoch": 0.54, "learning_rate": 9.291727023099087e-06, "loss": 0.4833, "step": 4698 }, { "epoch": 0.54, "learning_rate": 9.288034715354806e-06, "loss": 0.4474, "step": 4699 }, { "epoch": 0.54, "learning_rate": 9.28434250516566e-06, "loss": 0.4553, "step": 4700 }, { "epoch": 0.54, "learning_rate": 9.280650393037578e-06, "loss": 0.4573, "step": 4701 }, { "epoch": 0.54, "learning_rate": 9.276958379476449e-06, "loss": 0.4991, "step": 4702 }, { "epoch": 0.54, "learning_rate": 9.27326646498816e-06, "loss": 0.4458, "step": 4703 }, { "epoch": 0.54, "learning_rate": 9.269574650078594e-06, "loss": 0.471, "step": 4704 }, { "epoch": 0.54, "learning_rate": 9.265882935253605e-06, "loss": 0.4525, "step": 4705 }, { "epoch": 0.54, "learning_rate": 9.262191321019049e-06, "loss": 0.473, "step": 4706 }, { "epoch": 0.54, "learning_rate": 9.258499807880755e-06, "loss": 0.4637, "step": 4707 }, { "epoch": 0.54, "learning_rate": 9.254808396344536e-06, "loss": 0.4749, "step": 4708 }, { "epoch": 0.54, "learning_rate": 9.251117086916209e-06, "loss": 0.4477, "step": 4709 }, { "epoch": 0.54, "learning_rate": 9.247425880101561e-06, "loss": 0.4813, "step": 4710 }, { "epoch": 0.54, "learning_rate": 9.243734776406365e-06, "loss": 0.4593, "step": 4711 }, { "epoch": 0.54, "learning_rate": 9.240043776336397e-06, "loss": 0.4823, "step": 4712 }, { "epoch": 0.54, "learning_rate": 9.23635288039739e-06, "loss": 0.4511, "step": 4713 }, { "epoch": 0.54, "learning_rate": 9.232662089095091e-06, "loss": 0.4458, "step": 4714 }, { "epoch": 0.54, "learning_rate": 9.22897140293522e-06, "loss": 0.4836, "step": 4715 }, { "epoch": 0.54, "learning_rate": 9.225280822423477e-06, "loss": 0.4481, "step": 4716 }, { "epoch": 0.54, "learning_rate": 9.221590348065561e-06, "loss": 0.4664, "step": 4717 }, { "epoch": 0.54, "learning_rate": 9.217899980367142e-06, "loss": 0.4613, "step": 4718 }, { "epoch": 0.54, "learning_rate": 9.214209719833891e-06, "loss": 0.4589, "step": 4719 }, { "epoch": 0.54, "learning_rate": 9.210519566971452e-06, "loss": 0.4755, "step": 4720 }, { "epoch": 0.54, "learning_rate": 9.206829522285456e-06, "loss": 0.4648, "step": 4721 }, { "epoch": 0.54, "learning_rate": 9.203139586281527e-06, "loss": 0.4539, "step": 4722 }, { "epoch": 0.54, "learning_rate": 9.199449759465263e-06, "loss": 0.455, "step": 4723 }, { "epoch": 0.54, "learning_rate": 9.195760042342254e-06, "loss": 0.4757, "step": 4724 }, { "epoch": 0.54, "learning_rate": 9.192070435418079e-06, "loss": 0.4543, "step": 4725 }, { "epoch": 0.54, "learning_rate": 9.188380939198287e-06, "loss": 0.4611, "step": 4726 }, { "epoch": 0.54, "learning_rate": 9.184691554188432e-06, "loss": 0.4593, "step": 4727 }, { "epoch": 0.54, "learning_rate": 9.181002280894034e-06, "loss": 0.4526, "step": 4728 }, { "epoch": 0.54, "learning_rate": 9.177313119820608e-06, "loss": 0.4462, "step": 4729 }, { "epoch": 0.54, "learning_rate": 9.173624071473655e-06, "loss": 0.4694, "step": 4730 }, { "epoch": 0.54, "learning_rate": 9.16993513635865e-06, "loss": 0.4631, "step": 4731 }, { "epoch": 0.54, "learning_rate": 9.166246314981066e-06, "loss": 0.4379, "step": 4732 }, { "epoch": 0.54, "learning_rate": 9.162557607846352e-06, "loss": 0.4645, "step": 4733 }, { "epoch": 0.54, "learning_rate": 9.158869015459939e-06, "loss": 0.4768, "step": 4734 }, { "epoch": 0.54, "learning_rate": 9.155180538327255e-06, "loss": 0.4581, "step": 4735 }, { "epoch": 0.54, "learning_rate": 9.151492176953697e-06, "loss": 0.4598, "step": 4736 }, { "epoch": 0.54, "learning_rate": 9.147803931844651e-06, "loss": 0.4646, "step": 4737 }, { "epoch": 0.54, "learning_rate": 9.144115803505498e-06, "loss": 0.493, "step": 4738 }, { "epoch": 0.54, "learning_rate": 9.140427792441584e-06, "loss": 0.4566, "step": 4739 }, { "epoch": 0.54, "learning_rate": 9.136739899158257e-06, "loss": 0.4656, "step": 4740 }, { "epoch": 0.54, "learning_rate": 9.133052124160837e-06, "loss": 0.4568, "step": 4741 }, { "epoch": 0.54, "learning_rate": 9.129364467954628e-06, "loss": 0.4596, "step": 4742 }, { "epoch": 0.54, "learning_rate": 9.125676931044928e-06, "loss": 0.4573, "step": 4743 }, { "epoch": 0.54, "learning_rate": 9.121989513937007e-06, "loss": 0.456, "step": 4744 }, { "epoch": 0.54, "learning_rate": 9.11830221713613e-06, "loss": 0.4509, "step": 4745 }, { "epoch": 0.54, "learning_rate": 9.11461504114753e-06, "loss": 0.4743, "step": 4746 }, { "epoch": 0.54, "learning_rate": 9.110927986476434e-06, "loss": 0.4662, "step": 4747 }, { "epoch": 0.54, "learning_rate": 9.107241053628058e-06, "loss": 0.4476, "step": 4748 }, { "epoch": 0.54, "learning_rate": 9.103554243107592e-06, "loss": 0.4494, "step": 4749 }, { "epoch": 0.54, "learning_rate": 9.0998675554202e-06, "loss": 0.4702, "step": 4750 }, { "epoch": 0.54, "learning_rate": 9.096180991071055e-06, "loss": 0.4599, "step": 4751 }, { "epoch": 0.54, "learning_rate": 9.09249455056529e-06, "loss": 0.4609, "step": 4752 }, { "epoch": 0.54, "learning_rate": 9.088808234408037e-06, "loss": 0.4478, "step": 4753 }, { "epoch": 0.54, "learning_rate": 9.0851220431044e-06, "loss": 0.4582, "step": 4754 }, { "epoch": 0.54, "learning_rate": 9.081435977159464e-06, "loss": 0.4391, "step": 4755 }, { "epoch": 0.54, "learning_rate": 9.07775003707831e-06, "loss": 0.4849, "step": 4756 }, { "epoch": 0.54, "learning_rate": 9.074064223365986e-06, "loss": 0.4503, "step": 4757 }, { "epoch": 0.54, "learning_rate": 9.070378536527544e-06, "loss": 0.4415, "step": 4758 }, { "epoch": 0.54, "learning_rate": 9.066692977067996e-06, "loss": 0.4643, "step": 4759 }, { "epoch": 0.54, "learning_rate": 9.063007545492342e-06, "loss": 0.4695, "step": 4760 }, { "epoch": 0.54, "learning_rate": 9.059322242305579e-06, "loss": 0.4582, "step": 4761 }, { "epoch": 0.54, "learning_rate": 9.055637068012664e-06, "loss": 0.4431, "step": 4762 }, { "epoch": 0.54, "learning_rate": 9.051952023118563e-06, "loss": 0.4624, "step": 4763 }, { "epoch": 0.54, "learning_rate": 9.048267108128198e-06, "loss": 0.4788, "step": 4764 }, { "epoch": 0.54, "learning_rate": 9.044582323546486e-06, "loss": 0.457, "step": 4765 }, { "epoch": 0.54, "learning_rate": 9.040897669878327e-06, "loss": 0.4669, "step": 4766 }, { "epoch": 0.54, "learning_rate": 9.037213147628603e-06, "loss": 0.4772, "step": 4767 }, { "epoch": 0.54, "learning_rate": 9.033528757302167e-06, "loss": 0.4535, "step": 4768 }, { "epoch": 0.55, "learning_rate": 9.029844499403876e-06, "loss": 0.4751, "step": 4769 }, { "epoch": 0.55, "learning_rate": 9.026160374438543e-06, "loss": 0.4523, "step": 4770 }, { "epoch": 0.55, "learning_rate": 9.022476382910983e-06, "loss": 0.462, "step": 4771 }, { "epoch": 0.55, "learning_rate": 9.018792525325986e-06, "loss": 0.458, "step": 4772 }, { "epoch": 0.55, "learning_rate": 9.015108802188314e-06, "loss": 0.4503, "step": 4773 }, { "epoch": 0.55, "learning_rate": 9.01142521400273e-06, "loss": 0.4615, "step": 4774 }, { "epoch": 0.55, "learning_rate": 9.007741761273957e-06, "loss": 0.447, "step": 4775 }, { "epoch": 0.55, "learning_rate": 9.004058444506718e-06, "loss": 0.4495, "step": 4776 }, { "epoch": 0.55, "learning_rate": 9.000375264205713e-06, "loss": 0.4651, "step": 4777 }, { "epoch": 0.55, "learning_rate": 8.996692220875608e-06, "loss": 0.448, "step": 4778 }, { "epoch": 0.55, "learning_rate": 8.993009315021073e-06, "loss": 0.467, "step": 4779 }, { "epoch": 0.55, "learning_rate": 8.989326547146743e-06, "loss": 0.4631, "step": 4780 }, { "epoch": 0.55, "learning_rate": 8.985643917757237e-06, "loss": 0.4623, "step": 4781 }, { "epoch": 0.55, "learning_rate": 8.981961427357166e-06, "loss": 0.459, "step": 4782 }, { "epoch": 0.55, "learning_rate": 8.978279076451104e-06, "loss": 0.4612, "step": 4783 }, { "epoch": 0.55, "learning_rate": 8.974596865543624e-06, "loss": 0.449, "step": 4784 }, { "epoch": 0.55, "learning_rate": 8.970914795139264e-06, "loss": 0.4779, "step": 4785 }, { "epoch": 0.55, "learning_rate": 8.967232865742552e-06, "loss": 0.4482, "step": 4786 }, { "epoch": 0.55, "learning_rate": 8.963551077857999e-06, "loss": 0.4515, "step": 4787 }, { "epoch": 0.55, "learning_rate": 8.959869431990082e-06, "loss": 0.4554, "step": 4788 }, { "epoch": 0.55, "learning_rate": 8.956187928643281e-06, "loss": 0.474, "step": 4789 }, { "epoch": 0.55, "learning_rate": 8.952506568322036e-06, "loss": 0.4525, "step": 4790 }, { "epoch": 0.55, "learning_rate": 8.948825351530774e-06, "loss": 0.4463, "step": 4791 }, { "epoch": 0.55, "learning_rate": 8.945144278773914e-06, "loss": 0.4477, "step": 4792 }, { "epoch": 0.55, "learning_rate": 8.941463350555835e-06, "loss": 0.4675, "step": 4793 }, { "epoch": 0.55, "learning_rate": 8.937782567380908e-06, "loss": 0.4434, "step": 4794 }, { "epoch": 0.55, "learning_rate": 8.93410192975349e-06, "loss": 0.4687, "step": 4795 }, { "epoch": 0.55, "learning_rate": 8.9304214381779e-06, "loss": 0.4757, "step": 4796 }, { "epoch": 0.55, "learning_rate": 8.926741093158456e-06, "loss": 0.4694, "step": 4797 }, { "epoch": 0.55, "learning_rate": 8.923060895199442e-06, "loss": 0.4357, "step": 4798 }, { "epoch": 0.55, "learning_rate": 8.919380844805129e-06, "loss": 0.4529, "step": 4799 }, { "epoch": 0.55, "learning_rate": 8.915700942479769e-06, "loss": 0.4772, "step": 4800 }, { "epoch": 0.55, "learning_rate": 8.912021188727585e-06, "loss": 0.4556, "step": 4801 }, { "epoch": 0.55, "learning_rate": 8.908341584052791e-06, "loss": 0.4584, "step": 4802 }, { "epoch": 0.55, "learning_rate": 8.904662128959571e-06, "loss": 0.4709, "step": 4803 }, { "epoch": 0.55, "learning_rate": 8.900982823952093e-06, "loss": 0.4442, "step": 4804 }, { "epoch": 0.55, "learning_rate": 8.897303669534508e-06, "loss": 0.4682, "step": 4805 }, { "epoch": 0.55, "learning_rate": 8.89362466621094e-06, "loss": 0.4557, "step": 4806 }, { "epoch": 0.55, "learning_rate": 8.88994581448549e-06, "loss": 0.4719, "step": 4807 }, { "epoch": 0.55, "learning_rate": 8.886267114862248e-06, "loss": 0.4619, "step": 4808 }, { "epoch": 0.55, "learning_rate": 8.882588567845275e-06, "loss": 0.4531, "step": 4809 }, { "epoch": 0.55, "learning_rate": 8.87891017393862e-06, "loss": 0.4544, "step": 4810 }, { "epoch": 0.55, "learning_rate": 8.8752319336463e-06, "loss": 0.4691, "step": 4811 }, { "epoch": 0.55, "learning_rate": 8.871553847472313e-06, "loss": 0.4549, "step": 4812 }, { "epoch": 0.55, "learning_rate": 8.867875915920645e-06, "loss": 0.4411, "step": 4813 }, { "epoch": 0.55, "learning_rate": 8.86419813949525e-06, "loss": 0.4696, "step": 4814 }, { "epoch": 0.55, "learning_rate": 8.860520518700074e-06, "loss": 0.4568, "step": 4815 }, { "epoch": 0.55, "learning_rate": 8.856843054039026e-06, "loss": 0.4446, "step": 4816 }, { "epoch": 0.55, "learning_rate": 8.853165746015997e-06, "loss": 0.4509, "step": 4817 }, { "epoch": 0.55, "learning_rate": 8.849488595134867e-06, "loss": 0.4493, "step": 4818 }, { "epoch": 0.55, "learning_rate": 8.84581160189949e-06, "loss": 0.4747, "step": 4819 }, { "epoch": 0.55, "learning_rate": 8.842134766813687e-06, "loss": 0.4503, "step": 4820 }, { "epoch": 0.55, "learning_rate": 8.838458090381274e-06, "loss": 0.4668, "step": 4821 }, { "epoch": 0.55, "learning_rate": 8.834781573106035e-06, "loss": 0.4503, "step": 4822 }, { "epoch": 0.55, "learning_rate": 8.831105215491734e-06, "loss": 0.4464, "step": 4823 }, { "epoch": 0.55, "learning_rate": 8.827429018042119e-06, "loss": 0.467, "step": 4824 }, { "epoch": 0.55, "learning_rate": 8.823752981260904e-06, "loss": 0.4819, "step": 4825 }, { "epoch": 0.55, "learning_rate": 8.820077105651794e-06, "loss": 0.4618, "step": 4826 }, { "epoch": 0.55, "learning_rate": 8.81640139171846e-06, "loss": 0.478, "step": 4827 }, { "epoch": 0.55, "learning_rate": 8.812725839964564e-06, "loss": 0.4558, "step": 4828 }, { "epoch": 0.55, "learning_rate": 8.809050450893737e-06, "loss": 0.4699, "step": 4829 }, { "epoch": 0.55, "learning_rate": 8.805375225009583e-06, "loss": 0.4374, "step": 4830 }, { "epoch": 0.55, "learning_rate": 8.801700162815698e-06, "loss": 0.465, "step": 4831 }, { "epoch": 0.55, "learning_rate": 8.798025264815643e-06, "loss": 0.4757, "step": 4832 }, { "epoch": 0.55, "learning_rate": 8.79435053151296e-06, "loss": 0.4561, "step": 4833 }, { "epoch": 0.55, "learning_rate": 8.790675963411175e-06, "loss": 0.4736, "step": 4834 }, { "epoch": 0.55, "learning_rate": 8.787001561013779e-06, "loss": 0.4534, "step": 4835 }, { "epoch": 0.55, "learning_rate": 8.783327324824255e-06, "loss": 0.4696, "step": 4836 }, { "epoch": 0.55, "learning_rate": 8.779653255346049e-06, "loss": 0.4809, "step": 4837 }, { "epoch": 0.55, "learning_rate": 8.77597935308259e-06, "loss": 0.4455, "step": 4838 }, { "epoch": 0.55, "learning_rate": 8.772305618537293e-06, "loss": 0.4506, "step": 4839 }, { "epoch": 0.55, "learning_rate": 8.768632052213532e-06, "loss": 0.4514, "step": 4840 }, { "epoch": 0.55, "learning_rate": 8.764958654614673e-06, "loss": 0.4674, "step": 4841 }, { "epoch": 0.55, "learning_rate": 8.761285426244053e-06, "loss": 0.45, "step": 4842 }, { "epoch": 0.55, "learning_rate": 8.757612367604983e-06, "loss": 0.4517, "step": 4843 }, { "epoch": 0.55, "learning_rate": 8.753939479200758e-06, "loss": 0.4691, "step": 4844 }, { "epoch": 0.55, "learning_rate": 8.750266761534641e-06, "loss": 0.4638, "step": 4845 }, { "epoch": 0.55, "learning_rate": 8.746594215109884e-06, "loss": 0.4645, "step": 4846 }, { "epoch": 0.55, "learning_rate": 8.742921840429702e-06, "loss": 0.4585, "step": 4847 }, { "epoch": 0.55, "learning_rate": 8.73924963799729e-06, "loss": 0.4481, "step": 4848 }, { "epoch": 0.55, "learning_rate": 8.73557760831583e-06, "loss": 0.4553, "step": 4849 }, { "epoch": 0.55, "learning_rate": 8.731905751888466e-06, "loss": 0.4728, "step": 4850 }, { "epoch": 0.55, "learning_rate": 8.728234069218325e-06, "loss": 0.459, "step": 4851 }, { "epoch": 0.55, "learning_rate": 8.724562560808512e-06, "loss": 0.4681, "step": 4852 }, { "epoch": 0.55, "learning_rate": 8.720891227162099e-06, "loss": 0.4699, "step": 4853 }, { "epoch": 0.55, "learning_rate": 8.71722006878215e-06, "loss": 0.4628, "step": 4854 }, { "epoch": 0.55, "learning_rate": 8.71354908617169e-06, "loss": 0.4618, "step": 4855 }, { "epoch": 0.55, "learning_rate": 8.709878279833725e-06, "loss": 0.4481, "step": 4856 }, { "epoch": 0.56, "learning_rate": 8.706207650271243e-06, "loss": 0.4791, "step": 4857 }, { "epoch": 0.56, "learning_rate": 8.702537197987193e-06, "loss": 0.4634, "step": 4858 }, { "epoch": 0.56, "learning_rate": 8.698866923484521e-06, "loss": 0.4584, "step": 4859 }, { "epoch": 0.56, "learning_rate": 8.695196827266126e-06, "loss": 0.4717, "step": 4860 }, { "epoch": 0.56, "learning_rate": 8.691526909834895e-06, "loss": 0.4573, "step": 4861 }, { "epoch": 0.56, "learning_rate": 8.687857171693693e-06, "loss": 0.4662, "step": 4862 }, { "epoch": 0.56, "learning_rate": 8.684187613345356e-06, "loss": 0.4881, "step": 4863 }, { "epoch": 0.56, "learning_rate": 8.680518235292688e-06, "loss": 0.4418, "step": 4864 }, { "epoch": 0.56, "learning_rate": 8.676849038038483e-06, "loss": 0.4666, "step": 4865 }, { "epoch": 0.56, "learning_rate": 8.673180022085499e-06, "loss": 0.4722, "step": 4866 }, { "epoch": 0.56, "learning_rate": 8.669511187936478e-06, "loss": 0.4519, "step": 4867 }, { "epoch": 0.56, "learning_rate": 8.66584253609413e-06, "loss": 0.4627, "step": 4868 }, { "epoch": 0.56, "learning_rate": 8.662174067061135e-06, "loss": 0.4508, "step": 4869 }, { "epoch": 0.56, "learning_rate": 8.658505781340166e-06, "loss": 0.4772, "step": 4870 }, { "epoch": 0.56, "learning_rate": 8.654837679433852e-06, "loss": 0.4594, "step": 4871 }, { "epoch": 0.56, "learning_rate": 8.651169761844812e-06, "loss": 0.4637, "step": 4872 }, { "epoch": 0.56, "learning_rate": 8.64750202907563e-06, "loss": 0.4445, "step": 4873 }, { "epoch": 0.56, "learning_rate": 8.643834481628861e-06, "loss": 0.4444, "step": 4874 }, { "epoch": 0.56, "learning_rate": 8.640167120007047e-06, "loss": 0.4511, "step": 4875 }, { "epoch": 0.56, "learning_rate": 8.636499944712702e-06, "loss": 0.4727, "step": 4876 }, { "epoch": 0.56, "learning_rate": 8.6328329562483e-06, "loss": 0.4674, "step": 4877 }, { "epoch": 0.56, "learning_rate": 8.629166155116312e-06, "loss": 0.48, "step": 4878 }, { "epoch": 0.56, "learning_rate": 8.625499541819163e-06, "loss": 0.4411, "step": 4879 }, { "epoch": 0.56, "learning_rate": 8.621833116859264e-06, "loss": 0.4496, "step": 4880 }, { "epoch": 0.56, "learning_rate": 8.618166880739e-06, "loss": 0.5047, "step": 4881 }, { "epoch": 0.56, "learning_rate": 8.614500833960722e-06, "loss": 0.4631, "step": 4882 }, { "epoch": 0.56, "learning_rate": 8.610834977026765e-06, "loss": 0.4548, "step": 4883 }, { "epoch": 0.56, "learning_rate": 8.607169310439427e-06, "loss": 0.4439, "step": 4884 }, { "epoch": 0.56, "learning_rate": 8.603503834700993e-06, "loss": 0.4659, "step": 4885 }, { "epoch": 0.56, "learning_rate": 8.599838550313714e-06, "loss": 0.4751, "step": 4886 }, { "epoch": 0.56, "learning_rate": 8.596173457779807e-06, "loss": 0.4699, "step": 4887 }, { "epoch": 0.56, "learning_rate": 8.592508557601484e-06, "loss": 0.4542, "step": 4888 }, { "epoch": 0.56, "learning_rate": 8.588843850280911e-06, "loss": 0.4825, "step": 4889 }, { "epoch": 0.56, "learning_rate": 8.585179336320235e-06, "loss": 0.4437, "step": 4890 }, { "epoch": 0.56, "learning_rate": 8.58151501622158e-06, "loss": 0.455, "step": 4891 }, { "epoch": 0.56, "learning_rate": 8.577850890487035e-06, "loss": 0.4626, "step": 4892 }, { "epoch": 0.56, "learning_rate": 8.574186959618671e-06, "loss": 0.4551, "step": 4893 }, { "epoch": 0.56, "learning_rate": 8.570523224118526e-06, "loss": 0.472, "step": 4894 }, { "epoch": 0.56, "learning_rate": 8.566859684488611e-06, "loss": 0.4657, "step": 4895 }, { "epoch": 0.56, "learning_rate": 8.56319634123092e-06, "loss": 0.4572, "step": 4896 }, { "epoch": 0.56, "learning_rate": 8.559533194847406e-06, "loss": 0.4532, "step": 4897 }, { "epoch": 0.56, "learning_rate": 8.555870245840005e-06, "loss": 0.4627, "step": 4898 }, { "epoch": 0.56, "learning_rate": 8.552207494710623e-06, "loss": 0.4717, "step": 4899 }, { "epoch": 0.56, "learning_rate": 8.548544941961134e-06, "loss": 0.458, "step": 4900 }, { "epoch": 0.56, "learning_rate": 8.544882588093399e-06, "loss": 0.4661, "step": 4901 }, { "epoch": 0.56, "learning_rate": 8.541220433609234e-06, "loss": 0.4533, "step": 4902 }, { "epoch": 0.56, "learning_rate": 8.53755847901044e-06, "loss": 0.4695, "step": 4903 }, { "epoch": 0.56, "learning_rate": 8.533896724798784e-06, "loss": 0.4595, "step": 4904 }, { "epoch": 0.56, "learning_rate": 8.530235171476005e-06, "loss": 0.4565, "step": 4905 }, { "epoch": 0.56, "learning_rate": 8.526573819543828e-06, "loss": 0.4569, "step": 4906 }, { "epoch": 0.56, "learning_rate": 8.522912669503932e-06, "loss": 0.4691, "step": 4907 }, { "epoch": 0.56, "learning_rate": 8.519251721857977e-06, "loss": 0.4539, "step": 4908 }, { "epoch": 0.56, "learning_rate": 8.515590977107597e-06, "loss": 0.4729, "step": 4909 }, { "epoch": 0.56, "learning_rate": 8.511930435754391e-06, "loss": 0.4549, "step": 4910 }, { "epoch": 0.56, "learning_rate": 8.508270098299943e-06, "loss": 0.4571, "step": 4911 }, { "epoch": 0.56, "learning_rate": 8.504609965245793e-06, "loss": 0.4656, "step": 4912 }, { "epoch": 0.56, "learning_rate": 8.500950037093462e-06, "loss": 0.4603, "step": 4913 }, { "epoch": 0.56, "learning_rate": 8.49729031434445e-06, "loss": 0.4627, "step": 4914 }, { "epoch": 0.56, "learning_rate": 8.493630797500214e-06, "loss": 0.4876, "step": 4915 }, { "epoch": 0.56, "learning_rate": 8.489971487062184e-06, "loss": 0.4382, "step": 4916 }, { "epoch": 0.56, "learning_rate": 8.486312383531777e-06, "loss": 0.4776, "step": 4917 }, { "epoch": 0.56, "learning_rate": 8.482653487410367e-06, "loss": 0.4457, "step": 4918 }, { "epoch": 0.56, "learning_rate": 8.478994799199308e-06, "loss": 0.4529, "step": 4919 }, { "epoch": 0.56, "learning_rate": 8.47533631939992e-06, "loss": 0.4611, "step": 4920 }, { "epoch": 0.56, "learning_rate": 8.471678048513494e-06, "loss": 0.4637, "step": 4921 }, { "epoch": 0.56, "learning_rate": 8.468019987041298e-06, "loss": 0.4798, "step": 4922 }, { "epoch": 0.56, "learning_rate": 8.464362135484564e-06, "loss": 0.4612, "step": 4923 }, { "epoch": 0.56, "learning_rate": 8.460704494344508e-06, "loss": 0.45, "step": 4924 }, { "epoch": 0.56, "learning_rate": 8.4570470641223e-06, "loss": 0.4651, "step": 4925 }, { "epoch": 0.56, "learning_rate": 8.453389845319092e-06, "loss": 0.4471, "step": 4926 }, { "epoch": 0.56, "learning_rate": 8.449732838436006e-06, "loss": 0.4679, "step": 4927 }, { "epoch": 0.56, "learning_rate": 8.44607604397413e-06, "loss": 0.4558, "step": 4928 }, { "epoch": 0.56, "learning_rate": 8.442419462434533e-06, "loss": 0.4744, "step": 4929 }, { "epoch": 0.56, "learning_rate": 8.438763094318245e-06, "loss": 0.4627, "step": 4930 }, { "epoch": 0.56, "learning_rate": 8.435106940126266e-06, "loss": 0.4728, "step": 4931 }, { "epoch": 0.56, "learning_rate": 8.431451000359575e-06, "loss": 0.4689, "step": 4932 }, { "epoch": 0.56, "learning_rate": 8.42779527551912e-06, "loss": 0.4442, "step": 4933 }, { "epoch": 0.56, "learning_rate": 8.424139766105808e-06, "loss": 0.4379, "step": 4934 }, { "epoch": 0.56, "learning_rate": 8.420484472620535e-06, "loss": 0.4609, "step": 4935 }, { "epoch": 0.56, "learning_rate": 8.41682939556415e-06, "loss": 0.4641, "step": 4936 }, { "epoch": 0.56, "learning_rate": 8.413174535437486e-06, "loss": 0.4572, "step": 4937 }, { "epoch": 0.56, "learning_rate": 8.409519892741342e-06, "loss": 0.4448, "step": 4938 }, { "epoch": 0.56, "learning_rate": 8.405865467976477e-06, "loss": 0.4714, "step": 4939 }, { "epoch": 0.56, "learning_rate": 8.402211261643638e-06, "loss": 0.4533, "step": 4940 }, { "epoch": 0.56, "learning_rate": 8.398557274243524e-06, "loss": 0.4597, "step": 4941 }, { "epoch": 0.56, "learning_rate": 8.39490350627682e-06, "loss": 0.4445, "step": 4942 }, { "epoch": 0.56, "learning_rate": 8.391249958244173e-06, "loss": 0.4642, "step": 4943 }, { "epoch": 0.57, "learning_rate": 8.387596630646195e-06, "loss": 0.4629, "step": 4944 }, { "epoch": 0.57, "learning_rate": 8.383943523983482e-06, "loss": 0.445, "step": 4945 }, { "epoch": 0.57, "learning_rate": 8.380290638756584e-06, "loss": 0.4638, "step": 4946 }, { "epoch": 0.57, "learning_rate": 8.376637975466029e-06, "loss": 0.4669, "step": 4947 }, { "epoch": 0.57, "learning_rate": 8.372985534612317e-06, "loss": 0.4508, "step": 4948 }, { "epoch": 0.57, "learning_rate": 8.369333316695909e-06, "loss": 0.4773, "step": 4949 }, { "epoch": 0.57, "learning_rate": 8.365681322217247e-06, "loss": 0.4547, "step": 4950 }, { "epoch": 0.57, "learning_rate": 8.362029551676731e-06, "loss": 0.4548, "step": 4951 }, { "epoch": 0.57, "learning_rate": 8.358378005574731e-06, "loss": 0.4562, "step": 4952 }, { "epoch": 0.57, "learning_rate": 8.354726684411604e-06, "loss": 0.4575, "step": 4953 }, { "epoch": 0.57, "learning_rate": 8.351075588687648e-06, "loss": 0.4677, "step": 4954 }, { "epoch": 0.57, "learning_rate": 8.347424718903152e-06, "loss": 0.4593, "step": 4955 }, { "epoch": 0.57, "learning_rate": 8.343774075558366e-06, "loss": 0.4511, "step": 4956 }, { "epoch": 0.57, "learning_rate": 8.340123659153506e-06, "loss": 0.4596, "step": 4957 }, { "epoch": 0.57, "learning_rate": 8.336473470188767e-06, "loss": 0.4628, "step": 4958 }, { "epoch": 0.57, "learning_rate": 8.3328235091643e-06, "loss": 0.4524, "step": 4959 }, { "epoch": 0.57, "learning_rate": 8.329173776580236e-06, "loss": 0.4604, "step": 4960 }, { "epoch": 0.57, "learning_rate": 8.325524272936668e-06, "loss": 0.4824, "step": 4961 }, { "epoch": 0.57, "learning_rate": 8.321874998733654e-06, "loss": 0.4744, "step": 4962 }, { "epoch": 0.57, "learning_rate": 8.318225954471238e-06, "loss": 0.4642, "step": 4963 }, { "epoch": 0.57, "learning_rate": 8.31457714064941e-06, "loss": 0.4616, "step": 4964 }, { "epoch": 0.57, "learning_rate": 8.310928557768145e-06, "loss": 0.4421, "step": 4965 }, { "epoch": 0.57, "learning_rate": 8.307280206327376e-06, "loss": 0.4755, "step": 4966 }, { "epoch": 0.57, "learning_rate": 8.30363208682701e-06, "loss": 0.4527, "step": 4967 }, { "epoch": 0.57, "learning_rate": 8.299984199766925e-06, "loss": 0.4444, "step": 4968 }, { "epoch": 0.57, "learning_rate": 8.296336545646957e-06, "loss": 0.4497, "step": 4969 }, { "epoch": 0.57, "learning_rate": 8.292689124966917e-06, "loss": 0.4672, "step": 4970 }, { "epoch": 0.57, "learning_rate": 8.28904193822659e-06, "loss": 0.4503, "step": 4971 }, { "epoch": 0.57, "learning_rate": 8.285394985925714e-06, "loss": 0.4621, "step": 4972 }, { "epoch": 0.57, "learning_rate": 8.281748268564002e-06, "loss": 0.459, "step": 4973 }, { "epoch": 0.57, "learning_rate": 8.278101786641142e-06, "loss": 0.4655, "step": 4974 }, { "epoch": 0.57, "learning_rate": 8.27445554065678e-06, "loss": 0.4612, "step": 4975 }, { "epoch": 0.57, "learning_rate": 8.270809531110536e-06, "loss": 0.4627, "step": 4976 }, { "epoch": 0.57, "learning_rate": 8.267163758501992e-06, "loss": 0.4448, "step": 4977 }, { "epoch": 0.57, "learning_rate": 8.263518223330698e-06, "loss": 0.4608, "step": 4978 }, { "epoch": 0.57, "learning_rate": 8.259872926096177e-06, "loss": 0.4677, "step": 4979 }, { "epoch": 0.57, "learning_rate": 8.256227867297915e-06, "loss": 0.47, "step": 4980 }, { "epoch": 0.57, "learning_rate": 8.25258304743537e-06, "loss": 0.4541, "step": 4981 }, { "epoch": 0.57, "learning_rate": 8.24893846700796e-06, "loss": 0.4523, "step": 4982 }, { "epoch": 0.57, "learning_rate": 8.245294126515073e-06, "loss": 0.4618, "step": 4983 }, { "epoch": 0.57, "learning_rate": 8.241650026456065e-06, "loss": 0.4756, "step": 4984 }, { "epoch": 0.57, "learning_rate": 8.238006167330266e-06, "loss": 0.44, "step": 4985 }, { "epoch": 0.57, "learning_rate": 8.234362549636953e-06, "loss": 0.4509, "step": 4986 }, { "epoch": 0.57, "learning_rate": 8.230719173875399e-06, "loss": 0.4718, "step": 4987 }, { "epoch": 0.57, "learning_rate": 8.227076040544813e-06, "loss": 0.4867, "step": 4988 }, { "epoch": 0.57, "learning_rate": 8.223433150144393e-06, "loss": 0.4502, "step": 4989 }, { "epoch": 0.57, "learning_rate": 8.2197905031733e-06, "loss": 0.4644, "step": 4990 }, { "epoch": 0.57, "learning_rate": 8.216148100130647e-06, "loss": 0.4476, "step": 4991 }, { "epoch": 0.57, "learning_rate": 8.212505941515536e-06, "loss": 0.4573, "step": 4992 }, { "epoch": 0.57, "learning_rate": 8.208864027827015e-06, "loss": 0.474, "step": 4993 }, { "epoch": 0.57, "learning_rate": 8.205222359564113e-06, "loss": 0.4377, "step": 4994 }, { "epoch": 0.57, "learning_rate": 8.20158093722582e-06, "loss": 0.462, "step": 4995 }, { "epoch": 0.57, "learning_rate": 8.197939761311087e-06, "loss": 0.4753, "step": 4996 }, { "epoch": 0.57, "learning_rate": 8.194298832318843e-06, "loss": 0.4643, "step": 4997 }, { "epoch": 0.57, "learning_rate": 8.190658150747973e-06, "loss": 0.4496, "step": 4998 }, { "epoch": 0.57, "learning_rate": 8.187017717097327e-06, "loss": 0.4611, "step": 4999 }, { "epoch": 0.57, "learning_rate": 8.183377531865737e-06, "loss": 0.4553, "step": 5000 }, { "epoch": 0.57, "learning_rate": 8.179737595551979e-06, "loss": 0.4481, "step": 5001 }, { "epoch": 0.57, "learning_rate": 8.176097908654814e-06, "loss": 0.4679, "step": 5002 }, { "epoch": 0.57, "learning_rate": 8.172458471672953e-06, "loss": 0.4676, "step": 5003 }, { "epoch": 0.57, "learning_rate": 8.168819285105084e-06, "loss": 0.4493, "step": 5004 }, { "epoch": 0.57, "learning_rate": 8.165180349449857e-06, "loss": 0.4536, "step": 5005 }, { "epoch": 0.57, "learning_rate": 8.161541665205885e-06, "loss": 0.4662, "step": 5006 }, { "epoch": 0.57, "learning_rate": 8.157903232871755e-06, "loss": 0.4608, "step": 5007 }, { "epoch": 0.57, "learning_rate": 8.154265052946005e-06, "loss": 0.4607, "step": 5008 }, { "epoch": 0.57, "learning_rate": 8.15062712592715e-06, "loss": 0.4508, "step": 5009 }, { "epoch": 0.57, "learning_rate": 8.146989452313671e-06, "loss": 0.4459, "step": 5010 }, { "epoch": 0.57, "learning_rate": 8.143352032604007e-06, "loss": 0.4568, "step": 5011 }, { "epoch": 0.57, "learning_rate": 8.139714867296567e-06, "loss": 0.4647, "step": 5012 }, { "epoch": 0.57, "learning_rate": 8.136077956889723e-06, "loss": 0.4756, "step": 5013 }, { "epoch": 0.57, "learning_rate": 8.13244130188181e-06, "loss": 0.4675, "step": 5014 }, { "epoch": 0.57, "learning_rate": 8.128804902771137e-06, "loss": 0.4786, "step": 5015 }, { "epoch": 0.57, "learning_rate": 8.125168760055971e-06, "loss": 0.471, "step": 5016 }, { "epoch": 0.57, "learning_rate": 8.121532874234539e-06, "loss": 0.4604, "step": 5017 }, { "epoch": 0.57, "learning_rate": 8.117897245805044e-06, "loss": 0.4471, "step": 5018 }, { "epoch": 0.57, "learning_rate": 8.114261875265643e-06, "loss": 0.4433, "step": 5019 }, { "epoch": 0.57, "learning_rate": 8.11062676311447e-06, "loss": 0.4612, "step": 5020 }, { "epoch": 0.57, "learning_rate": 8.106991909849613e-06, "loss": 0.4797, "step": 5021 }, { "epoch": 0.57, "learning_rate": 8.103357315969127e-06, "loss": 0.4456, "step": 5022 }, { "epoch": 0.57, "learning_rate": 8.099722981971035e-06, "loss": 0.4634, "step": 5023 }, { "epoch": 0.57, "learning_rate": 8.096088908353316e-06, "loss": 0.4674, "step": 5024 }, { "epoch": 0.57, "learning_rate": 8.092455095613927e-06, "loss": 0.4568, "step": 5025 }, { "epoch": 0.57, "learning_rate": 8.088821544250778e-06, "loss": 0.4572, "step": 5026 }, { "epoch": 0.57, "learning_rate": 8.085188254761744e-06, "loss": 0.4588, "step": 5027 }, { "epoch": 0.57, "learning_rate": 8.081555227644674e-06, "loss": 0.4563, "step": 5028 }, { "epoch": 0.57, "learning_rate": 8.077922463397371e-06, "loss": 0.4857, "step": 5029 }, { "epoch": 0.57, "learning_rate": 8.074289962517597e-06, "loss": 0.4454, "step": 5030 }, { "epoch": 0.57, "learning_rate": 8.070657725503094e-06, "loss": 0.4636, "step": 5031 }, { "epoch": 0.58, "learning_rate": 8.067025752851555e-06, "loss": 0.4605, "step": 5032 }, { "epoch": 0.58, "learning_rate": 8.063394045060648e-06, "loss": 0.4575, "step": 5033 }, { "epoch": 0.58, "learning_rate": 8.059762602627995e-06, "loss": 0.4647, "step": 5034 }, { "epoch": 0.58, "learning_rate": 8.05613142605118e-06, "loss": 0.4465, "step": 5035 }, { "epoch": 0.58, "learning_rate": 8.052500515827759e-06, "loss": 0.4594, "step": 5036 }, { "epoch": 0.58, "learning_rate": 8.048869872455246e-06, "loss": 0.4623, "step": 5037 }, { "epoch": 0.58, "learning_rate": 8.045239496431125e-06, "loss": 0.4749, "step": 5038 }, { "epoch": 0.58, "learning_rate": 8.041609388252836e-06, "loss": 0.4546, "step": 5039 }, { "epoch": 0.58, "learning_rate": 8.037979548417781e-06, "loss": 0.4709, "step": 5040 }, { "epoch": 0.58, "learning_rate": 8.034349977423332e-06, "loss": 0.4572, "step": 5041 }, { "epoch": 0.58, "learning_rate": 8.030720675766825e-06, "loss": 0.4705, "step": 5042 }, { "epoch": 0.58, "learning_rate": 8.027091643945548e-06, "loss": 0.4479, "step": 5043 }, { "epoch": 0.58, "learning_rate": 8.023462882456768e-06, "loss": 0.4596, "step": 5044 }, { "epoch": 0.58, "learning_rate": 8.019834391797696e-06, "loss": 0.4481, "step": 5045 }, { "epoch": 0.58, "learning_rate": 8.016206172465525e-06, "loss": 0.4726, "step": 5046 }, { "epoch": 0.58, "learning_rate": 8.0125782249574e-06, "loss": 0.4526, "step": 5047 }, { "epoch": 0.58, "learning_rate": 8.008950549770426e-06, "loss": 0.4478, "step": 5048 }, { "epoch": 0.58, "learning_rate": 8.005323147401684e-06, "loss": 0.4693, "step": 5049 }, { "epoch": 0.58, "learning_rate": 8.0016960183482e-06, "loss": 0.4515, "step": 5050 }, { "epoch": 0.58, "learning_rate": 7.998069163106977e-06, "loss": 0.4497, "step": 5051 }, { "epoch": 0.58, "learning_rate": 7.994442582174976e-06, "loss": 0.4524, "step": 5052 }, { "epoch": 0.58, "learning_rate": 7.990816276049115e-06, "loss": 0.4489, "step": 5053 }, { "epoch": 0.58, "learning_rate": 7.987190245226285e-06, "loss": 0.4759, "step": 5054 }, { "epoch": 0.58, "learning_rate": 7.983564490203328e-06, "loss": 0.4643, "step": 5055 }, { "epoch": 0.58, "learning_rate": 7.979939011477052e-06, "loss": 0.4524, "step": 5056 }, { "epoch": 0.58, "learning_rate": 7.976313809544237e-06, "loss": 0.4649, "step": 5057 }, { "epoch": 0.58, "learning_rate": 7.972688884901606e-06, "loss": 0.439, "step": 5058 }, { "epoch": 0.58, "learning_rate": 7.969064238045865e-06, "loss": 0.4411, "step": 5059 }, { "epoch": 0.58, "learning_rate": 7.965439869473664e-06, "loss": 0.4819, "step": 5060 }, { "epoch": 0.58, "learning_rate": 7.961815779681624e-06, "loss": 0.4461, "step": 5061 }, { "epoch": 0.58, "learning_rate": 7.95819196916633e-06, "loss": 0.4635, "step": 5062 }, { "epoch": 0.58, "learning_rate": 7.954568438424315e-06, "loss": 0.44, "step": 5063 }, { "epoch": 0.58, "learning_rate": 7.9509451879521e-06, "loss": 0.4765, "step": 5064 }, { "epoch": 0.58, "learning_rate": 7.947322218246136e-06, "loss": 0.4726, "step": 5065 }, { "epoch": 0.58, "learning_rate": 7.943699529802854e-06, "loss": 0.4714, "step": 5066 }, { "epoch": 0.58, "learning_rate": 7.940077123118654e-06, "loss": 0.4558, "step": 5067 }, { "epoch": 0.58, "learning_rate": 7.936454998689875e-06, "loss": 0.4609, "step": 5068 }, { "epoch": 0.58, "learning_rate": 7.932833157012829e-06, "loss": 0.4656, "step": 5069 }, { "epoch": 0.58, "learning_rate": 7.929211598583795e-06, "loss": 0.4652, "step": 5070 }, { "epoch": 0.58, "learning_rate": 7.925590323899002e-06, "loss": 0.4624, "step": 5071 }, { "epoch": 0.58, "learning_rate": 7.921969333454652e-06, "loss": 0.46, "step": 5072 }, { "epoch": 0.58, "learning_rate": 7.918348627746896e-06, "loss": 0.4763, "step": 5073 }, { "epoch": 0.58, "learning_rate": 7.914728207271853e-06, "loss": 0.4567, "step": 5074 }, { "epoch": 0.58, "learning_rate": 7.911108072525603e-06, "loss": 0.4655, "step": 5075 }, { "epoch": 0.58, "learning_rate": 7.90748822400418e-06, "loss": 0.4465, "step": 5076 }, { "epoch": 0.58, "learning_rate": 7.903868662203594e-06, "loss": 0.4486, "step": 5077 }, { "epoch": 0.58, "learning_rate": 7.900249387619797e-06, "loss": 0.4767, "step": 5078 }, { "epoch": 0.58, "learning_rate": 7.896630400748715e-06, "loss": 0.4576, "step": 5079 }, { "epoch": 0.58, "learning_rate": 7.893011702086225e-06, "loss": 0.4671, "step": 5080 }, { "epoch": 0.58, "learning_rate": 7.889393292128177e-06, "loss": 0.4425, "step": 5081 }, { "epoch": 0.58, "learning_rate": 7.885775171370364e-06, "loss": 0.4573, "step": 5082 }, { "epoch": 0.58, "learning_rate": 7.88215734030856e-06, "loss": 0.4664, "step": 5083 }, { "epoch": 0.58, "learning_rate": 7.878539799438479e-06, "loss": 0.464, "step": 5084 }, { "epoch": 0.58, "learning_rate": 7.874922549255814e-06, "loss": 0.444, "step": 5085 }, { "epoch": 0.58, "learning_rate": 7.871305590256206e-06, "loss": 0.4777, "step": 5086 }, { "epoch": 0.58, "learning_rate": 7.867688922935253e-06, "loss": 0.4662, "step": 5087 }, { "epoch": 0.58, "learning_rate": 7.864072547788526e-06, "loss": 0.4694, "step": 5088 }, { "epoch": 0.58, "learning_rate": 7.860456465311544e-06, "loss": 0.4534, "step": 5089 }, { "epoch": 0.58, "learning_rate": 7.856840675999799e-06, "loss": 0.4482, "step": 5090 }, { "epoch": 0.58, "learning_rate": 7.85322518034873e-06, "loss": 0.4837, "step": 5091 }, { "epoch": 0.58, "learning_rate": 7.849609978853735e-06, "loss": 0.4548, "step": 5092 }, { "epoch": 0.58, "learning_rate": 7.845995072010188e-06, "loss": 0.4736, "step": 5093 }, { "epoch": 0.58, "learning_rate": 7.842380460313408e-06, "loss": 0.4498, "step": 5094 }, { "epoch": 0.58, "learning_rate": 7.83876614425867e-06, "loss": 0.4545, "step": 5095 }, { "epoch": 0.58, "learning_rate": 7.835152124341228e-06, "loss": 0.459, "step": 5096 }, { "epoch": 0.58, "learning_rate": 7.831538401056274e-06, "loss": 0.4741, "step": 5097 }, { "epoch": 0.58, "learning_rate": 7.827924974898973e-06, "loss": 0.4798, "step": 5098 }, { "epoch": 0.58, "learning_rate": 7.824311846364448e-06, "loss": 0.4477, "step": 5099 }, { "epoch": 0.58, "learning_rate": 7.82069901594777e-06, "loss": 0.4804, "step": 5100 }, { "epoch": 0.58, "learning_rate": 7.817086484143987e-06, "loss": 0.4712, "step": 5101 }, { "epoch": 0.58, "learning_rate": 7.813474251448086e-06, "loss": 0.44, "step": 5102 }, { "epoch": 0.58, "learning_rate": 7.809862318355033e-06, "loss": 0.4624, "step": 5103 }, { "epoch": 0.58, "learning_rate": 7.806250685359742e-06, "loss": 0.468, "step": 5104 }, { "epoch": 0.58, "learning_rate": 7.80263935295708e-06, "loss": 0.4681, "step": 5105 }, { "epoch": 0.58, "learning_rate": 7.799028321641889e-06, "loss": 0.457, "step": 5106 }, { "epoch": 0.58, "learning_rate": 7.795417591908954e-06, "loss": 0.4619, "step": 5107 }, { "epoch": 0.58, "learning_rate": 7.79180716425303e-06, "loss": 0.4449, "step": 5108 }, { "epoch": 0.58, "learning_rate": 7.788197039168829e-06, "loss": 0.4714, "step": 5109 }, { "epoch": 0.58, "learning_rate": 7.784587217151009e-06, "loss": 0.4515, "step": 5110 }, { "epoch": 0.58, "learning_rate": 7.780977698694206e-06, "loss": 0.4551, "step": 5111 }, { "epoch": 0.58, "learning_rate": 7.777368484293e-06, "loss": 0.4647, "step": 5112 }, { "epoch": 0.58, "learning_rate": 7.77375957444193e-06, "loss": 0.4572, "step": 5113 }, { "epoch": 0.58, "learning_rate": 7.770150969635509e-06, "loss": 0.4862, "step": 5114 }, { "epoch": 0.58, "learning_rate": 7.766542670368182e-06, "loss": 0.4475, "step": 5115 }, { "epoch": 0.58, "learning_rate": 7.76293467713438e-06, "loss": 0.4581, "step": 5116 }, { "epoch": 0.58, "learning_rate": 7.759326990428468e-06, "loss": 0.4624, "step": 5117 }, { "epoch": 0.58, "learning_rate": 7.755719610744783e-06, "loss": 0.4533, "step": 5118 }, { "epoch": 0.59, "learning_rate": 7.752112538577623e-06, "loss": 0.458, "step": 5119 }, { "epoch": 0.59, "learning_rate": 7.748505774421227e-06, "loss": 0.4647, "step": 5120 }, { "epoch": 0.59, "learning_rate": 7.744899318769811e-06, "loss": 0.4381, "step": 5121 }, { "epoch": 0.59, "learning_rate": 7.741293172117533e-06, "loss": 0.486, "step": 5122 }, { "epoch": 0.59, "learning_rate": 7.737687334958518e-06, "loss": 0.4649, "step": 5123 }, { "epoch": 0.59, "learning_rate": 7.73408180778685e-06, "loss": 0.4676, "step": 5124 }, { "epoch": 0.59, "learning_rate": 7.730476591096565e-06, "loss": 0.464, "step": 5125 }, { "epoch": 0.59, "learning_rate": 7.726871685381652e-06, "loss": 0.4425, "step": 5126 }, { "epoch": 0.59, "learning_rate": 7.72326709113607e-06, "loss": 0.4543, "step": 5127 }, { "epoch": 0.59, "learning_rate": 7.719662808853726e-06, "loss": 0.454, "step": 5128 }, { "epoch": 0.59, "learning_rate": 7.71605883902849e-06, "loss": 0.4574, "step": 5129 }, { "epoch": 0.59, "learning_rate": 7.712455182154186e-06, "loss": 0.477, "step": 5130 }, { "epoch": 0.59, "learning_rate": 7.708851838724592e-06, "loss": 0.4669, "step": 5131 }, { "epoch": 0.59, "learning_rate": 7.70524880923345e-06, "loss": 0.4791, "step": 5132 }, { "epoch": 0.59, "learning_rate": 7.701646094174451e-06, "loss": 0.4468, "step": 5133 }, { "epoch": 0.59, "learning_rate": 7.698043694041256e-06, "loss": 0.4403, "step": 5134 }, { "epoch": 0.59, "learning_rate": 7.694441609327465e-06, "loss": 0.4693, "step": 5135 }, { "epoch": 0.59, "learning_rate": 7.69083984052665e-06, "loss": 0.4503, "step": 5136 }, { "epoch": 0.59, "learning_rate": 7.68723838813233e-06, "loss": 0.4546, "step": 5137 }, { "epoch": 0.59, "learning_rate": 7.683637252637988e-06, "loss": 0.474, "step": 5138 }, { "epoch": 0.59, "learning_rate": 7.680036434537054e-06, "loss": 0.4519, "step": 5139 }, { "epoch": 0.59, "learning_rate": 7.676435934322925e-06, "loss": 0.4492, "step": 5140 }, { "epoch": 0.59, "learning_rate": 7.67283575248895e-06, "loss": 0.4679, "step": 5141 }, { "epoch": 0.59, "learning_rate": 7.669235889528436e-06, "loss": 0.4641, "step": 5142 }, { "epoch": 0.59, "learning_rate": 7.665636345934642e-06, "loss": 0.4657, "step": 5143 }, { "epoch": 0.59, "learning_rate": 7.662037122200783e-06, "loss": 0.4692, "step": 5144 }, { "epoch": 0.59, "learning_rate": 7.658438218820037e-06, "loss": 0.4639, "step": 5145 }, { "epoch": 0.59, "learning_rate": 7.65483963628553e-06, "loss": 0.4528, "step": 5146 }, { "epoch": 0.59, "learning_rate": 7.651241375090358e-06, "loss": 0.4656, "step": 5147 }, { "epoch": 0.59, "learning_rate": 7.647643435727555e-06, "loss": 0.4515, "step": 5148 }, { "epoch": 0.59, "learning_rate": 7.644045818690118e-06, "loss": 0.4597, "step": 5149 }, { "epoch": 0.59, "learning_rate": 7.640448524471002e-06, "loss": 0.4585, "step": 5150 }, { "epoch": 0.59, "learning_rate": 7.636851553563123e-06, "loss": 0.4527, "step": 5151 }, { "epoch": 0.59, "learning_rate": 7.633254906459335e-06, "loss": 0.4651, "step": 5152 }, { "epoch": 0.59, "learning_rate": 7.629658583652471e-06, "loss": 0.4537, "step": 5153 }, { "epoch": 0.59, "learning_rate": 7.6260625856352966e-06, "loss": 0.4566, "step": 5154 }, { "epoch": 0.59, "learning_rate": 7.6224669129005516e-06, "loss": 0.4639, "step": 5155 }, { "epoch": 0.59, "learning_rate": 7.6188715659409216e-06, "loss": 0.4979, "step": 5156 }, { "epoch": 0.59, "learning_rate": 7.615276545249046e-06, "loss": 0.4343, "step": 5157 }, { "epoch": 0.59, "learning_rate": 7.611681851317529e-06, "loss": 0.4736, "step": 5158 }, { "epoch": 0.59, "learning_rate": 7.608087484638915e-06, "loss": 0.4522, "step": 5159 }, { "epoch": 0.59, "learning_rate": 7.604493445705722e-06, "loss": 0.4479, "step": 5160 }, { "epoch": 0.59, "learning_rate": 7.60089973501041e-06, "loss": 0.4702, "step": 5161 }, { "epoch": 0.59, "learning_rate": 7.597306353045393e-06, "loss": 0.4507, "step": 5162 }, { "epoch": 0.59, "learning_rate": 7.593713300303054e-06, "loss": 0.4657, "step": 5163 }, { "epoch": 0.59, "learning_rate": 7.590120577275713e-06, "loss": 0.4633, "step": 5164 }, { "epoch": 0.59, "learning_rate": 7.586528184455653e-06, "loss": 0.4432, "step": 5165 }, { "epoch": 0.59, "learning_rate": 7.58293612233512e-06, "loss": 0.4541, "step": 5166 }, { "epoch": 0.59, "learning_rate": 7.579344391406299e-06, "loss": 0.4552, "step": 5167 }, { "epoch": 0.59, "learning_rate": 7.575752992161345e-06, "loss": 0.4491, "step": 5168 }, { "epoch": 0.59, "learning_rate": 7.572161925092352e-06, "loss": 0.4613, "step": 5169 }, { "epoch": 0.59, "learning_rate": 7.568571190691378e-06, "loss": 0.4477, "step": 5170 }, { "epoch": 0.59, "learning_rate": 7.564980789450438e-06, "loss": 0.4663, "step": 5171 }, { "epoch": 0.59, "learning_rate": 7.5613907218614925e-06, "loss": 0.4692, "step": 5172 }, { "epoch": 0.59, "learning_rate": 7.5578009884164646e-06, "loss": 0.4534, "step": 5173 }, { "epoch": 0.59, "learning_rate": 7.554211589607227e-06, "loss": 0.469, "step": 5174 }, { "epoch": 0.59, "learning_rate": 7.5506225259256025e-06, "loss": 0.4627, "step": 5175 }, { "epoch": 0.59, "learning_rate": 7.547033797863382e-06, "loss": 0.4678, "step": 5176 }, { "epoch": 0.59, "learning_rate": 7.543445405912298e-06, "loss": 0.4545, "step": 5177 }, { "epoch": 0.59, "learning_rate": 7.5398573505640326e-06, "loss": 0.4504, "step": 5178 }, { "epoch": 0.59, "learning_rate": 7.536269632310238e-06, "loss": 0.4522, "step": 5179 }, { "epoch": 0.59, "learning_rate": 7.532682251642508e-06, "loss": 0.4594, "step": 5180 }, { "epoch": 0.59, "learning_rate": 7.5290952090523995e-06, "loss": 0.4656, "step": 5181 }, { "epoch": 0.59, "learning_rate": 7.525508505031412e-06, "loss": 0.4779, "step": 5182 }, { "epoch": 0.59, "learning_rate": 7.521922140071003e-06, "loss": 0.4321, "step": 5183 }, { "epoch": 0.59, "learning_rate": 7.518336114662588e-06, "loss": 0.4792, "step": 5184 }, { "epoch": 0.59, "learning_rate": 7.514750429297528e-06, "loss": 0.4704, "step": 5185 }, { "epoch": 0.59, "learning_rate": 7.5111650844671515e-06, "loss": 0.4456, "step": 5186 }, { "epoch": 0.59, "learning_rate": 7.507580080662722e-06, "loss": 0.4904, "step": 5187 }, { "epoch": 0.59, "learning_rate": 7.5039954183754674e-06, "loss": 0.4394, "step": 5188 }, { "epoch": 0.59, "learning_rate": 7.5004110980965664e-06, "loss": 0.467, "step": 5189 }, { "epoch": 0.59, "learning_rate": 7.496827120317149e-06, "loss": 0.4668, "step": 5190 }, { "epoch": 0.59, "learning_rate": 7.493243485528306e-06, "loss": 0.4549, "step": 5191 }, { "epoch": 0.59, "learning_rate": 7.489660194221071e-06, "loss": 0.4694, "step": 5192 }, { "epoch": 0.59, "learning_rate": 7.486077246886435e-06, "loss": 0.465, "step": 5193 }, { "epoch": 0.59, "learning_rate": 7.4824946440153436e-06, "loss": 0.4509, "step": 5194 }, { "epoch": 0.59, "learning_rate": 7.478912386098692e-06, "loss": 0.4735, "step": 5195 }, { "epoch": 0.59, "learning_rate": 7.475330473627327e-06, "loss": 0.4617, "step": 5196 }, { "epoch": 0.59, "learning_rate": 7.471748907092056e-06, "loss": 0.4542, "step": 5197 }, { "epoch": 0.59, "learning_rate": 7.468167686983627e-06, "loss": 0.4588, "step": 5198 }, { "epoch": 0.59, "learning_rate": 7.464586813792757e-06, "loss": 0.4637, "step": 5199 }, { "epoch": 0.59, "learning_rate": 7.4610062880100985e-06, "loss": 0.4593, "step": 5200 }, { "epoch": 0.59, "learning_rate": 7.4574261101262604e-06, "loss": 0.4585, "step": 5201 }, { "epoch": 0.59, "learning_rate": 7.453846280631814e-06, "loss": 0.457, "step": 5202 }, { "epoch": 0.59, "learning_rate": 7.45026680001727e-06, "loss": 0.4588, "step": 5203 }, { "epoch": 0.59, "learning_rate": 7.446687668773105e-06, "loss": 0.4484, "step": 5204 }, { "epoch": 0.59, "learning_rate": 7.443108887389735e-06, "loss": 0.4708, "step": 5205 }, { "epoch": 0.59, "learning_rate": 7.439530456357528e-06, "loss": 0.452, "step": 5206 }, { "epoch": 0.6, "learning_rate": 7.435952376166818e-06, "loss": 0.4659, "step": 5207 }, { "epoch": 0.6, "learning_rate": 7.432374647307878e-06, "loss": 0.4689, "step": 5208 }, { "epoch": 0.6, "learning_rate": 7.428797270270933e-06, "loss": 0.4541, "step": 5209 }, { "epoch": 0.6, "learning_rate": 7.425220245546172e-06, "loss": 0.4608, "step": 5210 }, { "epoch": 0.6, "learning_rate": 7.421643573623717e-06, "loss": 0.4559, "step": 5211 }, { "epoch": 0.6, "learning_rate": 7.41806725499366e-06, "loss": 0.4525, "step": 5212 }, { "epoch": 0.6, "learning_rate": 7.4144912901460355e-06, "loss": 0.4628, "step": 5213 }, { "epoch": 0.6, "learning_rate": 7.410915679570825e-06, "loss": 0.4476, "step": 5214 }, { "epoch": 0.6, "learning_rate": 7.407340423757974e-06, "loss": 0.4521, "step": 5215 }, { "epoch": 0.6, "learning_rate": 7.403765523197365e-06, "loss": 0.4727, "step": 5216 }, { "epoch": 0.6, "learning_rate": 7.4001909783788465e-06, "loss": 0.4596, "step": 5217 }, { "epoch": 0.6, "learning_rate": 7.396616789792208e-06, "loss": 0.4606, "step": 5218 }, { "epoch": 0.6, "learning_rate": 7.39304295792719e-06, "loss": 0.485, "step": 5219 }, { "epoch": 0.6, "learning_rate": 7.389469483273495e-06, "loss": 0.4432, "step": 5220 }, { "epoch": 0.6, "learning_rate": 7.385896366320761e-06, "loss": 0.4672, "step": 5221 }, { "epoch": 0.6, "learning_rate": 7.382323607558585e-06, "loss": 0.4679, "step": 5222 }, { "epoch": 0.6, "learning_rate": 7.378751207476522e-06, "loss": 0.4712, "step": 5223 }, { "epoch": 0.6, "learning_rate": 7.375179166564062e-06, "loss": 0.4411, "step": 5224 }, { "epoch": 0.6, "learning_rate": 7.3716074853106635e-06, "loss": 0.4791, "step": 5225 }, { "epoch": 0.6, "learning_rate": 7.368036164205719e-06, "loss": 0.4627, "step": 5226 }, { "epoch": 0.6, "learning_rate": 7.3644652037385785e-06, "loss": 0.4696, "step": 5227 }, { "epoch": 0.6, "learning_rate": 7.3608946043985515e-06, "loss": 0.4502, "step": 5228 }, { "epoch": 0.6, "learning_rate": 7.357324366674881e-06, "loss": 0.4456, "step": 5229 }, { "epoch": 0.6, "learning_rate": 7.353754491056776e-06, "loss": 0.4576, "step": 5230 }, { "epoch": 0.6, "learning_rate": 7.350184978033386e-06, "loss": 0.4659, "step": 5231 }, { "epoch": 0.6, "learning_rate": 7.34661582809381e-06, "loss": 0.4441, "step": 5232 }, { "epoch": 0.6, "learning_rate": 7.3430470417271106e-06, "loss": 0.4653, "step": 5233 }, { "epoch": 0.6, "learning_rate": 7.339478619422287e-06, "loss": 0.4634, "step": 5234 }, { "epoch": 0.6, "learning_rate": 7.335910561668286e-06, "loss": 0.4618, "step": 5235 }, { "epoch": 0.6, "learning_rate": 7.3323428689540184e-06, "loss": 0.4568, "step": 5236 }, { "epoch": 0.6, "learning_rate": 7.328775541768336e-06, "loss": 0.4478, "step": 5237 }, { "epoch": 0.6, "learning_rate": 7.3252085806000474e-06, "loss": 0.4481, "step": 5238 }, { "epoch": 0.6, "learning_rate": 7.3216419859379e-06, "loss": 0.4719, "step": 5239 }, { "epoch": 0.6, "learning_rate": 7.318075758270593e-06, "loss": 0.4603, "step": 5240 }, { "epoch": 0.6, "learning_rate": 7.314509898086788e-06, "loss": 0.4593, "step": 5241 }, { "epoch": 0.6, "learning_rate": 7.31094440587508e-06, "loss": 0.4439, "step": 5242 }, { "epoch": 0.6, "learning_rate": 7.30737928212403e-06, "loss": 0.4547, "step": 5243 }, { "epoch": 0.6, "learning_rate": 7.303814527322132e-06, "loss": 0.4527, "step": 5244 }, { "epoch": 0.6, "learning_rate": 7.300250141957839e-06, "loss": 0.4529, "step": 5245 }, { "epoch": 0.6, "learning_rate": 7.296686126519552e-06, "loss": 0.4366, "step": 5246 }, { "epoch": 0.6, "learning_rate": 7.293122481495623e-06, "loss": 0.4555, "step": 5247 }, { "epoch": 0.6, "learning_rate": 7.2895592073743415e-06, "loss": 0.4766, "step": 5248 }, { "epoch": 0.6, "learning_rate": 7.2859963046439665e-06, "loss": 0.4804, "step": 5249 }, { "epoch": 0.6, "learning_rate": 7.282433773792689e-06, "loss": 0.4415, "step": 5250 }, { "epoch": 0.6, "learning_rate": 7.2788716153086604e-06, "loss": 0.4475, "step": 5251 }, { "epoch": 0.6, "learning_rate": 7.275309829679973e-06, "loss": 0.479, "step": 5252 }, { "epoch": 0.6, "learning_rate": 7.271748417394668e-06, "loss": 0.4674, "step": 5253 }, { "epoch": 0.6, "learning_rate": 7.2681873789407435e-06, "loss": 0.4474, "step": 5254 }, { "epoch": 0.6, "learning_rate": 7.264626714806135e-06, "loss": 0.4562, "step": 5255 }, { "epoch": 0.6, "learning_rate": 7.2610664254787425e-06, "loss": 0.4435, "step": 5256 }, { "epoch": 0.6, "learning_rate": 7.257506511446398e-06, "loss": 0.4784, "step": 5257 }, { "epoch": 0.6, "learning_rate": 7.253946973196888e-06, "loss": 0.4483, "step": 5258 }, { "epoch": 0.6, "learning_rate": 7.2503878112179534e-06, "loss": 0.4493, "step": 5259 }, { "epoch": 0.6, "learning_rate": 7.246829025997279e-06, "loss": 0.4603, "step": 5260 }, { "epoch": 0.6, "learning_rate": 7.243270618022492e-06, "loss": 0.4749, "step": 5261 }, { "epoch": 0.6, "learning_rate": 7.2397125877811816e-06, "loss": 0.4541, "step": 5262 }, { "epoch": 0.6, "learning_rate": 7.2361549357608685e-06, "loss": 0.4485, "step": 5263 }, { "epoch": 0.6, "learning_rate": 7.232597662449038e-06, "loss": 0.4716, "step": 5264 }, { "epoch": 0.6, "learning_rate": 7.2290407683331154e-06, "loss": 0.4592, "step": 5265 }, { "epoch": 0.6, "learning_rate": 7.225484253900468e-06, "loss": 0.4722, "step": 5266 }, { "epoch": 0.6, "learning_rate": 7.221928119638426e-06, "loss": 0.4733, "step": 5267 }, { "epoch": 0.6, "learning_rate": 7.218372366034252e-06, "loss": 0.4663, "step": 5268 }, { "epoch": 0.6, "learning_rate": 7.214816993575168e-06, "loss": 0.4417, "step": 5269 }, { "epoch": 0.6, "learning_rate": 7.211262002748341e-06, "loss": 0.4623, "step": 5270 }, { "epoch": 0.6, "learning_rate": 7.207707394040877e-06, "loss": 0.4508, "step": 5271 }, { "epoch": 0.6, "learning_rate": 7.2041531679398445e-06, "loss": 0.4486, "step": 5272 }, { "epoch": 0.6, "learning_rate": 7.200599324932246e-06, "loss": 0.4616, "step": 5273 }, { "epoch": 0.6, "learning_rate": 7.197045865505041e-06, "loss": 0.464, "step": 5274 }, { "epoch": 0.6, "learning_rate": 7.193492790145135e-06, "loss": 0.4784, "step": 5275 }, { "epoch": 0.6, "learning_rate": 7.18994009933937e-06, "loss": 0.441, "step": 5276 }, { "epoch": 0.6, "learning_rate": 7.186387793574554e-06, "loss": 0.4565, "step": 5277 }, { "epoch": 0.6, "learning_rate": 7.182835873337425e-06, "loss": 0.4541, "step": 5278 }, { "epoch": 0.6, "learning_rate": 7.179284339114676e-06, "loss": 0.4627, "step": 5279 }, { "epoch": 0.6, "learning_rate": 7.175733191392952e-06, "loss": 0.4565, "step": 5280 }, { "epoch": 0.6, "learning_rate": 7.172182430658832e-06, "loss": 0.4737, "step": 5281 }, { "epoch": 0.6, "learning_rate": 7.168632057398857e-06, "loss": 0.4672, "step": 5282 }, { "epoch": 0.6, "learning_rate": 7.165082072099503e-06, "loss": 0.453, "step": 5283 }, { "epoch": 0.6, "learning_rate": 7.161532475247195e-06, "loss": 0.4718, "step": 5284 }, { "epoch": 0.6, "learning_rate": 7.157983267328314e-06, "loss": 0.4627, "step": 5285 }, { "epoch": 0.6, "learning_rate": 7.1544344488291725e-06, "loss": 0.4551, "step": 5286 }, { "epoch": 0.6, "learning_rate": 7.150886020236045e-06, "loss": 0.4413, "step": 5287 }, { "epoch": 0.6, "learning_rate": 7.147337982035143e-06, "loss": 0.4505, "step": 5288 }, { "epoch": 0.6, "learning_rate": 7.143790334712623e-06, "loss": 0.4672, "step": 5289 }, { "epoch": 0.6, "learning_rate": 7.140243078754601e-06, "loss": 0.4728, "step": 5290 }, { "epoch": 0.6, "learning_rate": 7.136696214647123e-06, "loss": 0.4598, "step": 5291 }, { "epoch": 0.6, "learning_rate": 7.133149742876187e-06, "loss": 0.4481, "step": 5292 }, { "epoch": 0.6, "learning_rate": 7.129603663927742e-06, "loss": 0.4895, "step": 5293 }, { "epoch": 0.61, "learning_rate": 7.12605797828768e-06, "loss": 0.4599, "step": 5294 }, { "epoch": 0.61, "learning_rate": 7.1225126864418425e-06, "loss": 0.4663, "step": 5295 }, { "epoch": 0.61, "learning_rate": 7.118967788876011e-06, "loss": 0.4485, "step": 5296 }, { "epoch": 0.61, "learning_rate": 7.11542328607591e-06, "loss": 0.4594, "step": 5297 }, { "epoch": 0.61, "learning_rate": 7.111879178527223e-06, "loss": 0.4633, "step": 5298 }, { "epoch": 0.61, "learning_rate": 7.108335466715566e-06, "loss": 0.46, "step": 5299 }, { "epoch": 0.61, "learning_rate": 7.104792151126515e-06, "loss": 0.4562, "step": 5300 }, { "epoch": 0.61, "learning_rate": 7.101249232245576e-06, "loss": 0.4664, "step": 5301 }, { "epoch": 0.61, "learning_rate": 7.09770671055821e-06, "loss": 0.4507, "step": 5302 }, { "epoch": 0.61, "learning_rate": 7.094164586549821e-06, "loss": 0.4531, "step": 5303 }, { "epoch": 0.61, "learning_rate": 7.090622860705764e-06, "loss": 0.4541, "step": 5304 }, { "epoch": 0.61, "learning_rate": 7.087081533511324e-06, "loss": 0.4608, "step": 5305 }, { "epoch": 0.61, "learning_rate": 7.0835406054517505e-06, "loss": 0.4726, "step": 5306 }, { "epoch": 0.61, "learning_rate": 7.080000077012229e-06, "loss": 0.4511, "step": 5307 }, { "epoch": 0.61, "learning_rate": 7.076459948677889e-06, "loss": 0.4427, "step": 5308 }, { "epoch": 0.61, "learning_rate": 7.072920220933808e-06, "loss": 0.4556, "step": 5309 }, { "epoch": 0.61, "learning_rate": 7.069380894265004e-06, "loss": 0.4427, "step": 5310 }, { "epoch": 0.61, "learning_rate": 7.06584196915645e-06, "loss": 0.477, "step": 5311 }, { "epoch": 0.61, "learning_rate": 7.062303446093051e-06, "loss": 0.4334, "step": 5312 }, { "epoch": 0.61, "learning_rate": 7.058765325559673e-06, "loss": 0.4567, "step": 5313 }, { "epoch": 0.61, "learning_rate": 7.055227608041111e-06, "loss": 0.4657, "step": 5314 }, { "epoch": 0.61, "learning_rate": 7.051690294022108e-06, "loss": 0.4766, "step": 5315 }, { "epoch": 0.61, "learning_rate": 7.0481533839873614e-06, "loss": 0.4642, "step": 5316 }, { "epoch": 0.61, "learning_rate": 7.044616878421506e-06, "loss": 0.484, "step": 5317 }, { "epoch": 0.61, "learning_rate": 7.041080777809118e-06, "loss": 0.4496, "step": 5318 }, { "epoch": 0.61, "learning_rate": 7.037545082634729e-06, "loss": 0.456, "step": 5319 }, { "epoch": 0.61, "learning_rate": 7.034009793382799e-06, "loss": 0.4493, "step": 5320 }, { "epoch": 0.61, "learning_rate": 7.030474910537748e-06, "loss": 0.4484, "step": 5321 }, { "epoch": 0.61, "learning_rate": 7.0269404345839356e-06, "loss": 0.4352, "step": 5322 }, { "epoch": 0.61, "learning_rate": 7.023406366005655e-06, "loss": 0.4687, "step": 5323 }, { "epoch": 0.61, "learning_rate": 7.019872705287163e-06, "loss": 0.468, "step": 5324 }, { "epoch": 0.61, "learning_rate": 7.016339452912642e-06, "loss": 0.4487, "step": 5325 }, { "epoch": 0.61, "learning_rate": 7.012806609366231e-06, "loss": 0.4607, "step": 5326 }, { "epoch": 0.61, "learning_rate": 7.009274175132009e-06, "loss": 0.453, "step": 5327 }, { "epoch": 0.61, "learning_rate": 7.005742150693993e-06, "loss": 0.4402, "step": 5328 }, { "epoch": 0.61, "learning_rate": 7.0022105365361555e-06, "loss": 0.4583, "step": 5329 }, { "epoch": 0.61, "learning_rate": 6.998679333142403e-06, "loss": 0.4477, "step": 5330 }, { "epoch": 0.61, "learning_rate": 6.995148540996588e-06, "loss": 0.467, "step": 5331 }, { "epoch": 0.61, "learning_rate": 6.991618160582512e-06, "loss": 0.4758, "step": 5332 }, { "epoch": 0.61, "learning_rate": 6.9880881923839105e-06, "loss": 0.4547, "step": 5333 }, { "epoch": 0.61, "learning_rate": 6.9845586368844755e-06, "loss": 0.4476, "step": 5334 }, { "epoch": 0.61, "learning_rate": 6.981029494567828e-06, "loss": 0.4614, "step": 5335 }, { "epoch": 0.61, "learning_rate": 6.97750076591754e-06, "loss": 0.4657, "step": 5336 }, { "epoch": 0.61, "learning_rate": 6.973972451417132e-06, "loss": 0.4678, "step": 5337 }, { "epoch": 0.61, "learning_rate": 6.9704445515500544e-06, "loss": 0.4482, "step": 5338 }, { "epoch": 0.61, "learning_rate": 6.966917066799714e-06, "loss": 0.4502, "step": 5339 }, { "epoch": 0.61, "learning_rate": 6.9633899976494525e-06, "loss": 0.4655, "step": 5340 }, { "epoch": 0.61, "learning_rate": 6.959863344582554e-06, "loss": 0.4492, "step": 5341 }, { "epoch": 0.61, "learning_rate": 6.956337108082256e-06, "loss": 0.4732, "step": 5342 }, { "epoch": 0.61, "learning_rate": 6.952811288631728e-06, "loss": 0.4797, "step": 5343 }, { "epoch": 0.61, "learning_rate": 6.949285886714081e-06, "loss": 0.4374, "step": 5344 }, { "epoch": 0.61, "learning_rate": 6.9457609028123795e-06, "loss": 0.4326, "step": 5345 }, { "epoch": 0.61, "learning_rate": 6.942236337409623e-06, "loss": 0.4609, "step": 5346 }, { "epoch": 0.61, "learning_rate": 6.93871219098876e-06, "loss": 0.4855, "step": 5347 }, { "epoch": 0.61, "learning_rate": 6.935188464032674e-06, "loss": 0.4507, "step": 5348 }, { "epoch": 0.61, "learning_rate": 6.93166515702419e-06, "loss": 0.4745, "step": 5349 }, { "epoch": 0.61, "learning_rate": 6.928142270446086e-06, "loss": 0.4519, "step": 5350 }, { "epoch": 0.61, "learning_rate": 6.924619804781069e-06, "loss": 0.457, "step": 5351 }, { "epoch": 0.61, "learning_rate": 6.921097760511807e-06, "loss": 0.442, "step": 5352 }, { "epoch": 0.61, "learning_rate": 6.917576138120892e-06, "loss": 0.4732, "step": 5353 }, { "epoch": 0.61, "learning_rate": 6.91405493809086e-06, "loss": 0.4478, "step": 5354 }, { "epoch": 0.61, "learning_rate": 6.9105341609042e-06, "loss": 0.4681, "step": 5355 }, { "epoch": 0.61, "learning_rate": 6.907013807043335e-06, "loss": 0.4417, "step": 5356 }, { "epoch": 0.61, "learning_rate": 6.903493876990637e-06, "loss": 0.4551, "step": 5357 }, { "epoch": 0.61, "learning_rate": 6.899974371228409e-06, "loss": 0.4597, "step": 5358 }, { "epoch": 0.61, "learning_rate": 6.896455290238902e-06, "loss": 0.459, "step": 5359 }, { "epoch": 0.61, "learning_rate": 6.892936634504313e-06, "loss": 0.4587, "step": 5360 }, { "epoch": 0.61, "learning_rate": 6.889418404506774e-06, "loss": 0.467, "step": 5361 }, { "epoch": 0.61, "learning_rate": 6.885900600728358e-06, "loss": 0.4496, "step": 5362 }, { "epoch": 0.61, "learning_rate": 6.882383223651088e-06, "loss": 0.4505, "step": 5363 }, { "epoch": 0.61, "learning_rate": 6.878866273756919e-06, "loss": 0.4636, "step": 5364 }, { "epoch": 0.61, "learning_rate": 6.8753497515277555e-06, "loss": 0.4444, "step": 5365 }, { "epoch": 0.61, "learning_rate": 6.871833657445438e-06, "loss": 0.4537, "step": 5366 }, { "epoch": 0.61, "learning_rate": 6.8683179919917465e-06, "loss": 0.4657, "step": 5367 }, { "epoch": 0.61, "learning_rate": 6.8648027556484095e-06, "loss": 0.4502, "step": 5368 }, { "epoch": 0.61, "learning_rate": 6.861287948897091e-06, "loss": 0.4813, "step": 5369 }, { "epoch": 0.61, "learning_rate": 6.857773572219402e-06, "loss": 0.4466, "step": 5370 }, { "epoch": 0.61, "learning_rate": 6.854259626096888e-06, "loss": 0.4636, "step": 5371 }, { "epoch": 0.61, "learning_rate": 6.850746111011034e-06, "loss": 0.4505, "step": 5372 }, { "epoch": 0.61, "learning_rate": 6.847233027443274e-06, "loss": 0.4592, "step": 5373 }, { "epoch": 0.61, "learning_rate": 6.843720375874983e-06, "loss": 0.4563, "step": 5374 }, { "epoch": 0.61, "learning_rate": 6.8402081567874625e-06, "loss": 0.4667, "step": 5375 }, { "epoch": 0.61, "learning_rate": 6.836696370661975e-06, "loss": 0.4653, "step": 5376 }, { "epoch": 0.61, "learning_rate": 6.833185017979704e-06, "loss": 0.4613, "step": 5377 }, { "epoch": 0.61, "learning_rate": 6.8296740992217915e-06, "loss": 0.4702, "step": 5378 }, { "epoch": 0.61, "learning_rate": 6.82616361486931e-06, "loss": 0.4558, "step": 5379 }, { "epoch": 0.61, "learning_rate": 6.82265356540327e-06, "loss": 0.4441, "step": 5380 }, { "epoch": 0.61, "learning_rate": 6.819143951304632e-06, "loss": 0.4734, "step": 5381 }, { "epoch": 0.62, "learning_rate": 6.815634773054286e-06, "loss": 0.4551, "step": 5382 }, { "epoch": 0.62, "learning_rate": 6.812126031133073e-06, "loss": 0.4691, "step": 5383 }, { "epoch": 0.62, "learning_rate": 6.8086177260217675e-06, "loss": 0.4692, "step": 5384 }, { "epoch": 0.62, "learning_rate": 6.8051098582010825e-06, "loss": 0.4457, "step": 5385 }, { "epoch": 0.62, "learning_rate": 6.801602428151679e-06, "loss": 0.4683, "step": 5386 }, { "epoch": 0.62, "learning_rate": 6.7980954363541506e-06, "loss": 0.4593, "step": 5387 }, { "epoch": 0.62, "learning_rate": 6.79458888328903e-06, "loss": 0.4525, "step": 5388 }, { "epoch": 0.62, "learning_rate": 6.791082769436801e-06, "loss": 0.4436, "step": 5389 }, { "epoch": 0.62, "learning_rate": 6.787577095277873e-06, "loss": 0.4504, "step": 5390 }, { "epoch": 0.62, "learning_rate": 6.784071861292607e-06, "loss": 0.4928, "step": 5391 }, { "epoch": 0.62, "learning_rate": 6.780567067961293e-06, "loss": 0.4695, "step": 5392 }, { "epoch": 0.62, "learning_rate": 6.777062715764166e-06, "loss": 0.4518, "step": 5393 }, { "epoch": 0.62, "learning_rate": 6.773558805181408e-06, "loss": 0.4454, "step": 5394 }, { "epoch": 0.62, "learning_rate": 6.770055336693123e-06, "loss": 0.4695, "step": 5395 }, { "epoch": 0.62, "learning_rate": 6.766552310779374e-06, "loss": 0.4315, "step": 5396 }, { "epoch": 0.62, "learning_rate": 6.763049727920145e-06, "loss": 0.454, "step": 5397 }, { "epoch": 0.62, "learning_rate": 6.759547588595372e-06, "loss": 0.4592, "step": 5398 }, { "epoch": 0.62, "learning_rate": 6.7560458932849306e-06, "loss": 0.457, "step": 5399 }, { "epoch": 0.62, "learning_rate": 6.752544642468626e-06, "loss": 0.4682, "step": 5400 }, { "epoch": 0.62, "learning_rate": 6.749043836626203e-06, "loss": 0.4561, "step": 5401 }, { "epoch": 0.62, "learning_rate": 6.74554347623736e-06, "loss": 0.4611, "step": 5402 }, { "epoch": 0.62, "learning_rate": 6.742043561781717e-06, "loss": 0.4398, "step": 5403 }, { "epoch": 0.62, "learning_rate": 6.738544093738848e-06, "loss": 0.4694, "step": 5404 }, { "epoch": 0.62, "learning_rate": 6.735045072588256e-06, "loss": 0.4432, "step": 5405 }, { "epoch": 0.62, "learning_rate": 6.731546498809376e-06, "loss": 0.4421, "step": 5406 }, { "epoch": 0.62, "learning_rate": 6.7280483728816016e-06, "loss": 0.4487, "step": 5407 }, { "epoch": 0.62, "learning_rate": 6.724550695284247e-06, "loss": 0.4678, "step": 5408 }, { "epoch": 0.62, "learning_rate": 6.72105346649658e-06, "loss": 0.4643, "step": 5409 }, { "epoch": 0.62, "learning_rate": 6.717556686997795e-06, "loss": 0.4759, "step": 5410 }, { "epoch": 0.62, "learning_rate": 6.714060357267023e-06, "loss": 0.4702, "step": 5411 }, { "epoch": 0.62, "learning_rate": 6.7105644777833475e-06, "loss": 0.4544, "step": 5412 }, { "epoch": 0.62, "learning_rate": 6.707069049025781e-06, "loss": 0.4695, "step": 5413 }, { "epoch": 0.62, "learning_rate": 6.703574071473269e-06, "loss": 0.4528, "step": 5414 }, { "epoch": 0.62, "learning_rate": 6.700079545604707e-06, "loss": 0.4569, "step": 5415 }, { "epoch": 0.62, "learning_rate": 6.696585471898922e-06, "loss": 0.4543, "step": 5416 }, { "epoch": 0.62, "learning_rate": 6.693091850834681e-06, "loss": 0.4681, "step": 5417 }, { "epoch": 0.62, "learning_rate": 6.6895986828906886e-06, "loss": 0.4582, "step": 5418 }, { "epoch": 0.62, "learning_rate": 6.686105968545582e-06, "loss": 0.4586, "step": 5419 }, { "epoch": 0.62, "learning_rate": 6.682613708277945e-06, "loss": 0.4444, "step": 5420 }, { "epoch": 0.62, "learning_rate": 6.679121902566294e-06, "loss": 0.4541, "step": 5421 }, { "epoch": 0.62, "learning_rate": 6.675630551889088e-06, "loss": 0.4553, "step": 5422 }, { "epoch": 0.62, "learning_rate": 6.672139656724715e-06, "loss": 0.467, "step": 5423 }, { "epoch": 0.62, "learning_rate": 6.668649217551505e-06, "loss": 0.4665, "step": 5424 }, { "epoch": 0.62, "learning_rate": 6.665159234847731e-06, "loss": 0.4776, "step": 5425 }, { "epoch": 0.62, "learning_rate": 6.6616697090915975e-06, "loss": 0.4475, "step": 5426 }, { "epoch": 0.62, "learning_rate": 6.658180640761241e-06, "loss": 0.4668, "step": 5427 }, { "epoch": 0.62, "learning_rate": 6.654692030334753e-06, "loss": 0.4912, "step": 5428 }, { "epoch": 0.62, "learning_rate": 6.651203878290139e-06, "loss": 0.4346, "step": 5429 }, { "epoch": 0.62, "learning_rate": 6.647716185105362e-06, "loss": 0.4658, "step": 5430 }, { "epoch": 0.62, "learning_rate": 6.644228951258313e-06, "loss": 0.4585, "step": 5431 }, { "epoch": 0.62, "learning_rate": 6.640742177226816e-06, "loss": 0.4507, "step": 5432 }, { "epoch": 0.62, "learning_rate": 6.637255863488643e-06, "loss": 0.4771, "step": 5433 }, { "epoch": 0.62, "learning_rate": 6.63377001052149e-06, "loss": 0.4594, "step": 5434 }, { "epoch": 0.62, "learning_rate": 6.630284618803003e-06, "loss": 0.4394, "step": 5435 }, { "epoch": 0.62, "learning_rate": 6.626799688810759e-06, "loss": 0.4817, "step": 5436 }, { "epoch": 0.62, "learning_rate": 6.623315221022263e-06, "loss": 0.4329, "step": 5437 }, { "epoch": 0.62, "learning_rate": 6.619831215914974e-06, "loss": 0.4537, "step": 5438 }, { "epoch": 0.62, "learning_rate": 6.6163476739662724e-06, "loss": 0.449, "step": 5439 }, { "epoch": 0.62, "learning_rate": 6.612864595653483e-06, "loss": 0.4501, "step": 5440 }, { "epoch": 0.62, "learning_rate": 6.609381981453869e-06, "loss": 0.4529, "step": 5441 }, { "epoch": 0.62, "learning_rate": 6.60589983184462e-06, "loss": 0.4821, "step": 5442 }, { "epoch": 0.62, "learning_rate": 6.602418147302874e-06, "loss": 0.443, "step": 5443 }, { "epoch": 0.62, "learning_rate": 6.598936928305695e-06, "loss": 0.4841, "step": 5444 }, { "epoch": 0.62, "learning_rate": 6.5954561753300885e-06, "loss": 0.4656, "step": 5445 }, { "epoch": 0.62, "learning_rate": 6.591975888852998e-06, "loss": 0.4388, "step": 5446 }, { "epoch": 0.62, "learning_rate": 6.5884960693512965e-06, "loss": 0.463, "step": 5447 }, { "epoch": 0.62, "learning_rate": 6.585016717301805e-06, "loss": 0.4715, "step": 5448 }, { "epoch": 0.62, "learning_rate": 6.581537833181262e-06, "loss": 0.4748, "step": 5449 }, { "epoch": 0.62, "learning_rate": 6.578059417466356e-06, "loss": 0.45, "step": 5450 }, { "epoch": 0.62, "learning_rate": 6.5745814706337115e-06, "loss": 0.4486, "step": 5451 }, { "epoch": 0.62, "learning_rate": 6.57110399315988e-06, "loss": 0.4499, "step": 5452 }, { "epoch": 0.62, "learning_rate": 6.5676269855213585e-06, "loss": 0.4558, "step": 5453 }, { "epoch": 0.62, "learning_rate": 6.56415044819457e-06, "loss": 0.4761, "step": 5454 }, { "epoch": 0.62, "learning_rate": 6.560674381655876e-06, "loss": 0.4435, "step": 5455 }, { "epoch": 0.62, "learning_rate": 6.557198786381584e-06, "loss": 0.4555, "step": 5456 }, { "epoch": 0.62, "learning_rate": 6.553723662847924e-06, "loss": 0.4568, "step": 5457 }, { "epoch": 0.62, "learning_rate": 6.550249011531058e-06, "loss": 0.4636, "step": 5458 }, { "epoch": 0.62, "learning_rate": 6.546774832907101e-06, "loss": 0.461, "step": 5459 }, { "epoch": 0.62, "learning_rate": 6.543301127452086e-06, "loss": 0.4682, "step": 5460 }, { "epoch": 0.62, "learning_rate": 6.539827895641997e-06, "loss": 0.4469, "step": 5461 }, { "epoch": 0.62, "learning_rate": 6.536355137952737e-06, "loss": 0.495, "step": 5462 }, { "epoch": 0.62, "learning_rate": 6.53288285486015e-06, "loss": 0.4454, "step": 5463 }, { "epoch": 0.62, "learning_rate": 6.52941104684002e-06, "loss": 0.4627, "step": 5464 }, { "epoch": 0.62, "learning_rate": 6.52593971436806e-06, "loss": 0.4606, "step": 5465 }, { "epoch": 0.62, "learning_rate": 6.522468857919926e-06, "loss": 0.46, "step": 5466 }, { "epoch": 0.62, "learning_rate": 6.518998477971199e-06, "loss": 0.4615, "step": 5467 }, { "epoch": 0.62, "learning_rate": 6.515528574997394e-06, "loss": 0.4869, "step": 5468 }, { "epoch": 0.63, "learning_rate": 6.512059149473971e-06, "loss": 0.4803, "step": 5469 }, { "epoch": 0.63, "learning_rate": 6.508590201876317e-06, "loss": 0.4653, "step": 5470 }, { "epoch": 0.63, "learning_rate": 6.5051217326797535e-06, "loss": 0.4486, "step": 5471 }, { "epoch": 0.63, "learning_rate": 6.501653742359539e-06, "loss": 0.4593, "step": 5472 }, { "epoch": 0.63, "learning_rate": 6.49818623139087e-06, "loss": 0.4658, "step": 5473 }, { "epoch": 0.63, "learning_rate": 6.494719200248867e-06, "loss": 0.4547, "step": 5474 }, { "epoch": 0.63, "learning_rate": 6.491252649408596e-06, "loss": 0.4492, "step": 5475 }, { "epoch": 0.63, "learning_rate": 6.4877865793450445e-06, "loss": 0.4601, "step": 5476 }, { "epoch": 0.63, "learning_rate": 6.484320990533148e-06, "loss": 0.4599, "step": 5477 }, { "epoch": 0.63, "learning_rate": 6.480855883447767e-06, "loss": 0.4706, "step": 5478 }, { "epoch": 0.63, "learning_rate": 6.4773912585637e-06, "loss": 0.4422, "step": 5479 }, { "epoch": 0.63, "learning_rate": 6.473927116355678e-06, "loss": 0.4583, "step": 5480 }, { "epoch": 0.63, "learning_rate": 6.4704634572983615e-06, "loss": 0.442, "step": 5481 }, { "epoch": 0.63, "learning_rate": 6.4670002818663535e-06, "loss": 0.4692, "step": 5482 }, { "epoch": 0.63, "learning_rate": 6.463537590534188e-06, "loss": 0.4508, "step": 5483 }, { "epoch": 0.63, "learning_rate": 6.4600753837763255e-06, "loss": 0.4677, "step": 5484 }, { "epoch": 0.63, "learning_rate": 6.4566136620671705e-06, "loss": 0.4529, "step": 5485 }, { "epoch": 0.63, "learning_rate": 6.453152425881051e-06, "loss": 0.4515, "step": 5486 }, { "epoch": 0.63, "learning_rate": 6.4496916756922375e-06, "loss": 0.4291, "step": 5487 }, { "epoch": 0.63, "learning_rate": 6.4462314119749315e-06, "loss": 0.464, "step": 5488 }, { "epoch": 0.63, "learning_rate": 6.44277163520326e-06, "loss": 0.4463, "step": 5489 }, { "epoch": 0.63, "learning_rate": 6.439312345851298e-06, "loss": 0.4595, "step": 5490 }, { "epoch": 0.63, "learning_rate": 6.435853544393038e-06, "loss": 0.4468, "step": 5491 }, { "epoch": 0.63, "learning_rate": 6.432395231302418e-06, "loss": 0.451, "step": 5492 }, { "epoch": 0.63, "learning_rate": 6.428937407053304e-06, "loss": 0.4634, "step": 5493 }, { "epoch": 0.63, "learning_rate": 6.425480072119488e-06, "loss": 0.459, "step": 5494 }, { "epoch": 0.63, "learning_rate": 6.422023226974713e-06, "loss": 0.4458, "step": 5495 }, { "epoch": 0.63, "learning_rate": 6.4185668720926365e-06, "loss": 0.455, "step": 5496 }, { "epoch": 0.63, "learning_rate": 6.4151110079468545e-06, "loss": 0.4607, "step": 5497 }, { "epoch": 0.63, "learning_rate": 6.411655635010907e-06, "loss": 0.4528, "step": 5498 }, { "epoch": 0.63, "learning_rate": 6.4082007537582465e-06, "loss": 0.4468, "step": 5499 }, { "epoch": 0.63, "learning_rate": 6.40474636466228e-06, "loss": 0.458, "step": 5500 }, { "epoch": 0.63, "learning_rate": 6.4012924681963255e-06, "loss": 0.4821, "step": 5501 }, { "epoch": 0.63, "learning_rate": 6.397839064833647e-06, "loss": 0.458, "step": 5502 }, { "epoch": 0.63, "learning_rate": 6.394386155047443e-06, "loss": 0.4543, "step": 5503 }, { "epoch": 0.63, "learning_rate": 6.39093373931083e-06, "loss": 0.4515, "step": 5504 }, { "epoch": 0.63, "learning_rate": 6.387481818096877e-06, "loss": 0.4509, "step": 5505 }, { "epoch": 0.63, "learning_rate": 6.384030391878566e-06, "loss": 0.4444, "step": 5506 }, { "epoch": 0.63, "learning_rate": 6.38057946112882e-06, "loss": 0.4718, "step": 5507 }, { "epoch": 0.63, "learning_rate": 6.3771290263205e-06, "loss": 0.4506, "step": 5508 }, { "epoch": 0.63, "learning_rate": 6.373679087926388e-06, "loss": 0.4686, "step": 5509 }, { "epoch": 0.63, "learning_rate": 6.370229646419199e-06, "loss": 0.4743, "step": 5510 }, { "epoch": 0.63, "learning_rate": 6.366780702271589e-06, "loss": 0.458, "step": 5511 }, { "epoch": 0.63, "learning_rate": 6.363332255956136e-06, "loss": 0.4525, "step": 5512 }, { "epoch": 0.63, "learning_rate": 6.359884307945363e-06, "loss": 0.4658, "step": 5513 }, { "epoch": 0.63, "learning_rate": 6.356436858711708e-06, "loss": 0.4587, "step": 5514 }, { "epoch": 0.63, "learning_rate": 6.352989908727546e-06, "loss": 0.4463, "step": 5515 }, { "epoch": 0.63, "learning_rate": 6.349543458465193e-06, "loss": 0.4761, "step": 5516 }, { "epoch": 0.63, "learning_rate": 6.346097508396885e-06, "loss": 0.4726, "step": 5517 }, { "epoch": 0.63, "learning_rate": 6.3426520589947985e-06, "loss": 0.4668, "step": 5518 }, { "epoch": 0.63, "learning_rate": 6.339207110731036e-06, "loss": 0.4606, "step": 5519 }, { "epoch": 0.63, "learning_rate": 6.335762664077627e-06, "loss": 0.454, "step": 5520 }, { "epoch": 0.63, "learning_rate": 6.332318719506543e-06, "loss": 0.469, "step": 5521 }, { "epoch": 0.63, "learning_rate": 6.328875277489677e-06, "loss": 0.4462, "step": 5522 }, { "epoch": 0.63, "learning_rate": 6.325432338498865e-06, "loss": 0.4572, "step": 5523 }, { "epoch": 0.63, "learning_rate": 6.321989903005861e-06, "loss": 0.4478, "step": 5524 }, { "epoch": 0.63, "learning_rate": 6.318547971482352e-06, "loss": 0.4604, "step": 5525 }, { "epoch": 0.63, "learning_rate": 6.315106544399966e-06, "loss": 0.4631, "step": 5526 }, { "epoch": 0.63, "learning_rate": 6.311665622230254e-06, "loss": 0.4559, "step": 5527 }, { "epoch": 0.63, "learning_rate": 6.3082252054446955e-06, "loss": 0.455, "step": 5528 }, { "epoch": 0.63, "learning_rate": 6.304785294514709e-06, "loss": 0.4549, "step": 5529 }, { "epoch": 0.63, "learning_rate": 6.301345889911636e-06, "loss": 0.4664, "step": 5530 }, { "epoch": 0.63, "learning_rate": 6.297906992106755e-06, "loss": 0.4549, "step": 5531 }, { "epoch": 0.63, "learning_rate": 6.29446860157127e-06, "loss": 0.4561, "step": 5532 }, { "epoch": 0.63, "learning_rate": 6.291030718776313e-06, "loss": 0.4534, "step": 5533 }, { "epoch": 0.63, "learning_rate": 6.287593344192957e-06, "loss": 0.4905, "step": 5534 }, { "epoch": 0.63, "learning_rate": 6.284156478292196e-06, "loss": 0.4596, "step": 5535 }, { "epoch": 0.63, "learning_rate": 6.2807201215449584e-06, "loss": 0.4457, "step": 5536 }, { "epoch": 0.63, "learning_rate": 6.277284274422104e-06, "loss": 0.4593, "step": 5537 }, { "epoch": 0.63, "learning_rate": 6.273848937394413e-06, "loss": 0.463, "step": 5538 }, { "epoch": 0.63, "learning_rate": 6.270414110932611e-06, "loss": 0.4587, "step": 5539 }, { "epoch": 0.63, "learning_rate": 6.266979795507346e-06, "loss": 0.4452, "step": 5540 }, { "epoch": 0.63, "learning_rate": 6.2635459915891876e-06, "loss": 0.4585, "step": 5541 }, { "epoch": 0.63, "learning_rate": 6.260112699648653e-06, "loss": 0.4637, "step": 5542 }, { "epoch": 0.63, "learning_rate": 6.256679920156172e-06, "loss": 0.4702, "step": 5543 }, { "epoch": 0.63, "learning_rate": 6.253247653582119e-06, "loss": 0.4526, "step": 5544 }, { "epoch": 0.63, "learning_rate": 6.2498159003967896e-06, "loss": 0.4575, "step": 5545 }, { "epoch": 0.63, "learning_rate": 6.246384661070404e-06, "loss": 0.4568, "step": 5546 }, { "epoch": 0.63, "learning_rate": 6.2429539360731286e-06, "loss": 0.4498, "step": 5547 }, { "epoch": 0.63, "learning_rate": 6.239523725875041e-06, "loss": 0.4679, "step": 5548 }, { "epoch": 0.63, "learning_rate": 6.23609403094616e-06, "loss": 0.4461, "step": 5549 }, { "epoch": 0.63, "learning_rate": 6.232664851756434e-06, "loss": 0.4776, "step": 5550 }, { "epoch": 0.63, "learning_rate": 6.229236188775729e-06, "loss": 0.4537, "step": 5551 }, { "epoch": 0.63, "learning_rate": 6.225808042473857e-06, "loss": 0.4517, "step": 5552 }, { "epoch": 0.63, "learning_rate": 6.222380413320546e-06, "loss": 0.4589, "step": 5553 }, { "epoch": 0.63, "learning_rate": 6.218953301785453e-06, "loss": 0.462, "step": 5554 }, { "epoch": 0.63, "learning_rate": 6.2155267083381795e-06, "loss": 0.4469, "step": 5555 }, { "epoch": 0.63, "learning_rate": 6.212100633448237e-06, "loss": 0.4665, "step": 5556 }, { "epoch": 0.64, "learning_rate": 6.208675077585079e-06, "loss": 0.4465, "step": 5557 }, { "epoch": 0.64, "learning_rate": 6.2052500412180805e-06, "loss": 0.4778, "step": 5558 }, { "epoch": 0.64, "learning_rate": 6.201825524816545e-06, "loss": 0.4497, "step": 5559 }, { "epoch": 0.64, "learning_rate": 6.198401528849717e-06, "loss": 0.4788, "step": 5560 }, { "epoch": 0.64, "learning_rate": 6.194978053786749e-06, "loss": 0.4548, "step": 5561 }, { "epoch": 0.64, "learning_rate": 6.191555100096744e-06, "loss": 0.4663, "step": 5562 }, { "epoch": 0.64, "learning_rate": 6.188132668248716e-06, "loss": 0.4589, "step": 5563 }, { "epoch": 0.64, "learning_rate": 6.184710758711616e-06, "loss": 0.4489, "step": 5564 }, { "epoch": 0.64, "learning_rate": 6.181289371954327e-06, "loss": 0.4458, "step": 5565 }, { "epoch": 0.64, "learning_rate": 6.177868508445651e-06, "loss": 0.4718, "step": 5566 }, { "epoch": 0.64, "learning_rate": 6.174448168654317e-06, "loss": 0.4501, "step": 5567 }, { "epoch": 0.64, "learning_rate": 6.171028353048996e-06, "loss": 0.4906, "step": 5568 }, { "epoch": 0.64, "learning_rate": 6.167609062098276e-06, "loss": 0.4411, "step": 5569 }, { "epoch": 0.64, "learning_rate": 6.164190296270683e-06, "loss": 0.4616, "step": 5570 }, { "epoch": 0.64, "learning_rate": 6.160772056034655e-06, "loss": 0.4449, "step": 5571 }, { "epoch": 0.64, "learning_rate": 6.157354341858568e-06, "loss": 0.4601, "step": 5572 }, { "epoch": 0.64, "learning_rate": 6.1539371542107295e-06, "loss": 0.4472, "step": 5573 }, { "epoch": 0.64, "learning_rate": 6.1505204935593665e-06, "loss": 0.4845, "step": 5574 }, { "epoch": 0.64, "learning_rate": 6.147104360372644e-06, "loss": 0.4442, "step": 5575 }, { "epoch": 0.64, "learning_rate": 6.1436887551186466e-06, "loss": 0.4733, "step": 5576 }, { "epoch": 0.64, "learning_rate": 6.14027367826538e-06, "loss": 0.4424, "step": 5577 }, { "epoch": 0.64, "learning_rate": 6.136859130280794e-06, "loss": 0.4735, "step": 5578 }, { "epoch": 0.64, "learning_rate": 6.133445111632761e-06, "loss": 0.4515, "step": 5579 }, { "epoch": 0.64, "learning_rate": 6.130031622789067e-06, "loss": 0.4605, "step": 5580 }, { "epoch": 0.64, "learning_rate": 6.126618664217448e-06, "loss": 0.4499, "step": 5581 }, { "epoch": 0.64, "learning_rate": 6.123206236385543e-06, "loss": 0.4527, "step": 5582 }, { "epoch": 0.64, "learning_rate": 6.119794339760941e-06, "loss": 0.4556, "step": 5583 }, { "epoch": 0.64, "learning_rate": 6.1163829748111466e-06, "loss": 0.4661, "step": 5584 }, { "epoch": 0.64, "learning_rate": 6.112972142003587e-06, "loss": 0.45, "step": 5585 }, { "epoch": 0.64, "learning_rate": 6.109561841805629e-06, "loss": 0.4588, "step": 5586 }, { "epoch": 0.64, "learning_rate": 6.106152074684556e-06, "loss": 0.4475, "step": 5587 }, { "epoch": 0.64, "learning_rate": 6.102742841107585e-06, "loss": 0.4708, "step": 5588 }, { "epoch": 0.64, "learning_rate": 6.099334141541856e-06, "loss": 0.4573, "step": 5589 }, { "epoch": 0.64, "learning_rate": 6.095925976454433e-06, "loss": 0.4513, "step": 5590 }, { "epoch": 0.64, "learning_rate": 6.092518346312317e-06, "loss": 0.4378, "step": 5591 }, { "epoch": 0.64, "learning_rate": 6.089111251582427e-06, "loss": 0.4679, "step": 5592 }, { "epoch": 0.64, "learning_rate": 6.085704692731609e-06, "loss": 0.4659, "step": 5593 }, { "epoch": 0.64, "learning_rate": 6.082298670226642e-06, "loss": 0.4478, "step": 5594 }, { "epoch": 0.64, "learning_rate": 6.0788931845342205e-06, "loss": 0.452, "step": 5595 }, { "epoch": 0.64, "learning_rate": 6.075488236120978e-06, "loss": 0.4487, "step": 5596 }, { "epoch": 0.64, "learning_rate": 6.0720838254534675e-06, "loss": 0.4547, "step": 5597 }, { "epoch": 0.64, "learning_rate": 6.068679952998167e-06, "loss": 0.4457, "step": 5598 }, { "epoch": 0.64, "learning_rate": 6.065276619221485e-06, "loss": 0.4448, "step": 5599 }, { "epoch": 0.64, "learning_rate": 6.061873824589751e-06, "loss": 0.4378, "step": 5600 }, { "epoch": 0.64, "learning_rate": 6.058471569569228e-06, "loss": 0.462, "step": 5601 }, { "epoch": 0.64, "learning_rate": 6.055069854626102e-06, "loss": 0.4632, "step": 5602 }, { "epoch": 0.64, "learning_rate": 6.051668680226477e-06, "loss": 0.4506, "step": 5603 }, { "epoch": 0.64, "learning_rate": 6.0482680468363964e-06, "loss": 0.4816, "step": 5604 }, { "epoch": 0.64, "learning_rate": 6.044867954921818e-06, "loss": 0.4275, "step": 5605 }, { "epoch": 0.64, "learning_rate": 6.0414684049486335e-06, "loss": 0.4369, "step": 5606 }, { "epoch": 0.64, "learning_rate": 6.0380693973826595e-06, "loss": 0.4646, "step": 5607 }, { "epoch": 0.64, "learning_rate": 6.034670932689629e-06, "loss": 0.4391, "step": 5608 }, { "epoch": 0.64, "learning_rate": 6.031273011335215e-06, "loss": 0.4563, "step": 5609 }, { "epoch": 0.64, "learning_rate": 6.027875633785003e-06, "loss": 0.4534, "step": 5610 }, { "epoch": 0.64, "learning_rate": 6.024478800504509e-06, "loss": 0.4575, "step": 5611 }, { "epoch": 0.64, "learning_rate": 6.0210825119591806e-06, "loss": 0.4483, "step": 5612 }, { "epoch": 0.64, "learning_rate": 6.0176867686143795e-06, "loss": 0.446, "step": 5613 }, { "epoch": 0.64, "learning_rate": 6.014291570935405e-06, "loss": 0.448, "step": 5614 }, { "epoch": 0.64, "learning_rate": 6.0108969193874675e-06, "loss": 0.4926, "step": 5615 }, { "epoch": 0.64, "learning_rate": 6.007502814435713e-06, "loss": 0.4475, "step": 5616 }, { "epoch": 0.64, "learning_rate": 6.0041092565452135e-06, "loss": 0.4339, "step": 5617 }, { "epoch": 0.64, "learning_rate": 6.000716246180953e-06, "loss": 0.4616, "step": 5618 }, { "epoch": 0.64, "learning_rate": 5.9973237838078625e-06, "loss": 0.474, "step": 5619 }, { "epoch": 0.64, "learning_rate": 5.993931869890774e-06, "loss": 0.4726, "step": 5620 }, { "epoch": 0.64, "learning_rate": 5.9905405048944575e-06, "loss": 0.464, "step": 5621 }, { "epoch": 0.64, "learning_rate": 5.987149689283614e-06, "loss": 0.4486, "step": 5622 }, { "epoch": 0.64, "learning_rate": 5.983759423522852e-06, "loss": 0.4448, "step": 5623 }, { "epoch": 0.64, "learning_rate": 5.980369708076713e-06, "loss": 0.4598, "step": 5624 }, { "epoch": 0.64, "learning_rate": 5.976980543409669e-06, "loss": 0.4511, "step": 5625 }, { "epoch": 0.64, "learning_rate": 5.973591929986108e-06, "loss": 0.4508, "step": 5626 }, { "epoch": 0.64, "learning_rate": 5.97020386827035e-06, "loss": 0.4723, "step": 5627 }, { "epoch": 0.64, "learning_rate": 5.966816358726633e-06, "loss": 0.4761, "step": 5628 }, { "epoch": 0.64, "learning_rate": 5.9634294018191145e-06, "loss": 0.4594, "step": 5629 }, { "epoch": 0.64, "learning_rate": 5.960042998011892e-06, "loss": 0.4682, "step": 5630 }, { "epoch": 0.64, "learning_rate": 5.9566571477689735e-06, "loss": 0.4535, "step": 5631 }, { "epoch": 0.64, "learning_rate": 5.953271851554303e-06, "loss": 0.4446, "step": 5632 }, { "epoch": 0.64, "learning_rate": 5.949887109831736e-06, "loss": 0.4797, "step": 5633 }, { "epoch": 0.64, "learning_rate": 5.946502923065054e-06, "loss": 0.4445, "step": 5634 }, { "epoch": 0.64, "learning_rate": 5.943119291717974e-06, "loss": 0.4538, "step": 5635 }, { "epoch": 0.64, "learning_rate": 5.939736216254126e-06, "loss": 0.4487, "step": 5636 }, { "epoch": 0.64, "learning_rate": 5.936353697137063e-06, "loss": 0.4681, "step": 5637 }, { "epoch": 0.64, "learning_rate": 5.932971734830273e-06, "loss": 0.4663, "step": 5638 }, { "epoch": 0.64, "learning_rate": 5.929590329797154e-06, "loss": 0.4624, "step": 5639 }, { "epoch": 0.64, "learning_rate": 5.926209482501037e-06, "loss": 0.4462, "step": 5640 }, { "epoch": 0.64, "learning_rate": 5.9228291934051754e-06, "loss": 0.4564, "step": 5641 }, { "epoch": 0.64, "learning_rate": 5.919449462972737e-06, "loss": 0.4501, "step": 5642 }, { "epoch": 0.64, "learning_rate": 5.916070291666831e-06, "loss": 0.4547, "step": 5643 }, { "epoch": 0.65, "learning_rate": 5.9126916799504685e-06, "loss": 0.4662, "step": 5644 }, { "epoch": 0.65, "learning_rate": 5.9093136282866014e-06, "loss": 0.4753, "step": 5645 }, { "epoch": 0.65, "learning_rate": 5.9059361371381e-06, "loss": 0.4517, "step": 5646 }, { "epoch": 0.65, "learning_rate": 5.9025592069677475e-06, "loss": 0.4549, "step": 5647 }, { "epoch": 0.65, "learning_rate": 5.899182838238265e-06, "loss": 0.4504, "step": 5648 }, { "epoch": 0.65, "learning_rate": 5.895807031412293e-06, "loss": 0.4433, "step": 5649 }, { "epoch": 0.65, "learning_rate": 5.892431786952384e-06, "loss": 0.453, "step": 5650 }, { "epoch": 0.65, "learning_rate": 5.8890571053210295e-06, "loss": 0.4681, "step": 5651 }, { "epoch": 0.65, "learning_rate": 5.88568298698063e-06, "loss": 0.4705, "step": 5652 }, { "epoch": 0.65, "learning_rate": 5.88230943239352e-06, "loss": 0.4575, "step": 5653 }, { "epoch": 0.65, "learning_rate": 5.878936442021952e-06, "loss": 0.4592, "step": 5654 }, { "epoch": 0.65, "learning_rate": 5.875564016328096e-06, "loss": 0.457, "step": 5655 }, { "epoch": 0.65, "learning_rate": 5.872192155774056e-06, "loss": 0.4668, "step": 5656 }, { "epoch": 0.65, "learning_rate": 5.868820860821844e-06, "loss": 0.4524, "step": 5657 }, { "epoch": 0.65, "learning_rate": 5.8654501319334105e-06, "loss": 0.4498, "step": 5658 }, { "epoch": 0.65, "learning_rate": 5.862079969570619e-06, "loss": 0.4785, "step": 5659 }, { "epoch": 0.65, "learning_rate": 5.858710374195251e-06, "loss": 0.4567, "step": 5660 }, { "epoch": 0.65, "learning_rate": 5.855341346269026e-06, "loss": 0.4633, "step": 5661 }, { "epoch": 0.65, "learning_rate": 5.851972886253569e-06, "loss": 0.4638, "step": 5662 }, { "epoch": 0.65, "learning_rate": 5.848604994610434e-06, "loss": 0.441, "step": 5663 }, { "epoch": 0.65, "learning_rate": 5.845237671801103e-06, "loss": 0.4802, "step": 5664 }, { "epoch": 0.65, "learning_rate": 5.841870918286967e-06, "loss": 0.4347, "step": 5665 }, { "epoch": 0.65, "learning_rate": 5.838504734529353e-06, "loss": 0.4517, "step": 5666 }, { "epoch": 0.65, "learning_rate": 5.835139120989503e-06, "loss": 0.4683, "step": 5667 }, { "epoch": 0.65, "learning_rate": 5.831774078128574e-06, "loss": 0.4603, "step": 5668 }, { "epoch": 0.65, "learning_rate": 5.828409606407659e-06, "loss": 0.48, "step": 5669 }, { "epoch": 0.65, "learning_rate": 5.825045706287762e-06, "loss": 0.4576, "step": 5670 }, { "epoch": 0.65, "learning_rate": 5.821682378229813e-06, "loss": 0.4416, "step": 5671 }, { "epoch": 0.65, "learning_rate": 5.818319622694668e-06, "loss": 0.4558, "step": 5672 }, { "epoch": 0.65, "learning_rate": 5.814957440143092e-06, "loss": 0.4724, "step": 5673 }, { "epoch": 0.65, "learning_rate": 5.811595831035786e-06, "loss": 0.4637, "step": 5674 }, { "epoch": 0.65, "learning_rate": 5.8082347958333625e-06, "loss": 0.4548, "step": 5675 }, { "epoch": 0.65, "learning_rate": 5.804874334996353e-06, "loss": 0.4525, "step": 5676 }, { "epoch": 0.65, "learning_rate": 5.801514448985226e-06, "loss": 0.4845, "step": 5677 }, { "epoch": 0.65, "learning_rate": 5.798155138260352e-06, "loss": 0.4575, "step": 5678 }, { "epoch": 0.65, "learning_rate": 5.794796403282035e-06, "loss": 0.4511, "step": 5679 }, { "epoch": 0.65, "learning_rate": 5.791438244510499e-06, "loss": 0.4552, "step": 5680 }, { "epoch": 0.65, "learning_rate": 5.788080662405881e-06, "loss": 0.4433, "step": 5681 }, { "epoch": 0.65, "learning_rate": 5.784723657428255e-06, "loss": 0.4881, "step": 5682 }, { "epoch": 0.65, "learning_rate": 5.781367230037592e-06, "loss": 0.4417, "step": 5683 }, { "epoch": 0.65, "learning_rate": 5.7780113806938095e-06, "loss": 0.4435, "step": 5684 }, { "epoch": 0.65, "learning_rate": 5.774656109856729e-06, "loss": 0.4837, "step": 5685 }, { "epoch": 0.65, "learning_rate": 5.7713014179860925e-06, "loss": 0.4599, "step": 5686 }, { "epoch": 0.65, "learning_rate": 5.767947305541577e-06, "loss": 0.459, "step": 5687 }, { "epoch": 0.65, "learning_rate": 5.764593772982762e-06, "loss": 0.4506, "step": 5688 }, { "epoch": 0.65, "learning_rate": 5.76124082076916e-06, "loss": 0.4723, "step": 5689 }, { "epoch": 0.65, "learning_rate": 5.757888449360205e-06, "loss": 0.4578, "step": 5690 }, { "epoch": 0.65, "learning_rate": 5.754536659215239e-06, "loss": 0.4623, "step": 5691 }, { "epoch": 0.65, "learning_rate": 5.751185450793539e-06, "loss": 0.4391, "step": 5692 }, { "epoch": 0.65, "learning_rate": 5.747834824554293e-06, "loss": 0.458, "step": 5693 }, { "epoch": 0.65, "learning_rate": 5.744484780956605e-06, "loss": 0.4721, "step": 5694 }, { "epoch": 0.65, "learning_rate": 5.741135320459516e-06, "loss": 0.4749, "step": 5695 }, { "epoch": 0.65, "learning_rate": 5.737786443521968e-06, "loss": 0.4534, "step": 5696 }, { "epoch": 0.65, "learning_rate": 5.734438150602841e-06, "loss": 0.449, "step": 5697 }, { "epoch": 0.65, "learning_rate": 5.731090442160917e-06, "loss": 0.4614, "step": 5698 }, { "epoch": 0.65, "learning_rate": 5.727743318654911e-06, "loss": 0.4712, "step": 5699 }, { "epoch": 0.65, "learning_rate": 5.724396780543457e-06, "loss": 0.4552, "step": 5700 }, { "epoch": 0.65, "learning_rate": 5.721050828285097e-06, "loss": 0.4427, "step": 5701 }, { "epoch": 0.65, "learning_rate": 5.717705462338311e-06, "loss": 0.4601, "step": 5702 }, { "epoch": 0.65, "learning_rate": 5.714360683161484e-06, "loss": 0.4697, "step": 5703 }, { "epoch": 0.65, "learning_rate": 5.711016491212922e-06, "loss": 0.4579, "step": 5704 }, { "epoch": 0.65, "learning_rate": 5.707672886950859e-06, "loss": 0.4585, "step": 5705 }, { "epoch": 0.65, "learning_rate": 5.704329870833443e-06, "loss": 0.4581, "step": 5706 }, { "epoch": 0.65, "learning_rate": 5.700987443318737e-06, "loss": 0.4484, "step": 5707 }, { "epoch": 0.65, "learning_rate": 5.697645604864732e-06, "loss": 0.4493, "step": 5708 }, { "epoch": 0.65, "learning_rate": 5.694304355929333e-06, "loss": 0.4515, "step": 5709 }, { "epoch": 0.65, "learning_rate": 5.690963696970371e-06, "loss": 0.4578, "step": 5710 }, { "epoch": 0.65, "learning_rate": 5.687623628445588e-06, "loss": 0.4852, "step": 5711 }, { "epoch": 0.65, "learning_rate": 5.684284150812642e-06, "loss": 0.4439, "step": 5712 }, { "epoch": 0.65, "learning_rate": 5.680945264529125e-06, "loss": 0.4691, "step": 5713 }, { "epoch": 0.65, "learning_rate": 5.67760697005253e-06, "loss": 0.4385, "step": 5714 }, { "epoch": 0.65, "learning_rate": 5.674269267840287e-06, "loss": 0.4582, "step": 5715 }, { "epoch": 0.65, "learning_rate": 5.670932158349732e-06, "loss": 0.4456, "step": 5716 }, { "epoch": 0.65, "learning_rate": 5.667595642038117e-06, "loss": 0.4779, "step": 5717 }, { "epoch": 0.65, "learning_rate": 5.664259719362627e-06, "loss": 0.4467, "step": 5718 }, { "epoch": 0.65, "learning_rate": 5.660924390780359e-06, "loss": 0.4604, "step": 5719 }, { "epoch": 0.65, "learning_rate": 5.657589656748321e-06, "loss": 0.4391, "step": 5720 }, { "epoch": 0.65, "learning_rate": 5.654255517723452e-06, "loss": 0.4577, "step": 5721 }, { "epoch": 0.65, "learning_rate": 5.650921974162598e-06, "loss": 0.45, "step": 5722 }, { "epoch": 0.65, "learning_rate": 5.647589026522535e-06, "loss": 0.4597, "step": 5723 }, { "epoch": 0.65, "learning_rate": 5.644256675259949e-06, "loss": 0.4548, "step": 5724 }, { "epoch": 0.65, "learning_rate": 5.640924920831441e-06, "loss": 0.4683, "step": 5725 }, { "epoch": 0.65, "learning_rate": 5.637593763693545e-06, "loss": 0.4619, "step": 5726 }, { "epoch": 0.65, "learning_rate": 5.634263204302694e-06, "loss": 0.453, "step": 5727 }, { "epoch": 0.65, "learning_rate": 5.630933243115255e-06, "loss": 0.4557, "step": 5728 }, { "epoch": 0.65, "learning_rate": 5.627603880587511e-06, "loss": 0.4494, "step": 5729 }, { "epoch": 0.65, "learning_rate": 5.624275117175649e-06, "loss": 0.4481, "step": 5730 }, { "epoch": 0.65, "learning_rate": 5.620946953335793e-06, "loss": 0.4744, "step": 5731 }, { "epoch": 0.66, "learning_rate": 5.617619389523973e-06, "loss": 0.4303, "step": 5732 }, { "epoch": 0.66, "learning_rate": 5.614292426196133e-06, "loss": 0.4716, "step": 5733 }, { "epoch": 0.66, "learning_rate": 5.610966063808152e-06, "loss": 0.4592, "step": 5734 }, { "epoch": 0.66, "learning_rate": 5.607640302815806e-06, "loss": 0.4709, "step": 5735 }, { "epoch": 0.66, "learning_rate": 5.6043151436748035e-06, "loss": 0.4491, "step": 5736 }, { "epoch": 0.66, "learning_rate": 5.600990586840768e-06, "loss": 0.4589, "step": 5737 }, { "epoch": 0.66, "learning_rate": 5.597666632769232e-06, "loss": 0.4456, "step": 5738 }, { "epoch": 0.66, "learning_rate": 5.594343281915658e-06, "loss": 0.4658, "step": 5739 }, { "epoch": 0.66, "learning_rate": 5.5910205347354114e-06, "loss": 0.4628, "step": 5740 }, { "epoch": 0.66, "learning_rate": 5.587698391683792e-06, "loss": 0.433, "step": 5741 }, { "epoch": 0.66, "learning_rate": 5.584376853216003e-06, "loss": 0.4459, "step": 5742 }, { "epoch": 0.66, "learning_rate": 5.581055919787165e-06, "loss": 0.4464, "step": 5743 }, { "epoch": 0.66, "learning_rate": 5.577735591852327e-06, "loss": 0.4552, "step": 5744 }, { "epoch": 0.66, "learning_rate": 5.574415869866443e-06, "loss": 0.4547, "step": 5745 }, { "epoch": 0.66, "learning_rate": 5.571096754284389e-06, "loss": 0.4586, "step": 5746 }, { "epoch": 0.66, "learning_rate": 5.567778245560966e-06, "loss": 0.5003, "step": 5747 }, { "epoch": 0.66, "learning_rate": 5.564460344150873e-06, "loss": 0.4509, "step": 5748 }, { "epoch": 0.66, "learning_rate": 5.561143050508746e-06, "loss": 0.4781, "step": 5749 }, { "epoch": 0.66, "learning_rate": 5.5578263650891225e-06, "loss": 0.4499, "step": 5750 }, { "epoch": 0.66, "learning_rate": 5.554510288346459e-06, "loss": 0.4647, "step": 5751 }, { "epoch": 0.66, "learning_rate": 5.551194820735144e-06, "loss": 0.4586, "step": 5752 }, { "epoch": 0.66, "learning_rate": 5.547879962709457e-06, "loss": 0.4501, "step": 5753 }, { "epoch": 0.66, "learning_rate": 5.544565714723619e-06, "loss": 0.4588, "step": 5754 }, { "epoch": 0.66, "learning_rate": 5.541252077231746e-06, "loss": 0.4566, "step": 5755 }, { "epoch": 0.66, "learning_rate": 5.537939050687886e-06, "loss": 0.4355, "step": 5756 }, { "epoch": 0.66, "learning_rate": 5.534626635546e-06, "loss": 0.4584, "step": 5757 }, { "epoch": 0.66, "learning_rate": 5.53131483225996e-06, "loss": 0.458, "step": 5758 }, { "epoch": 0.66, "learning_rate": 5.528003641283552e-06, "loss": 0.451, "step": 5759 }, { "epoch": 0.66, "learning_rate": 5.524693063070492e-06, "loss": 0.4604, "step": 5760 }, { "epoch": 0.66, "learning_rate": 5.521383098074395e-06, "loss": 0.4517, "step": 5761 }, { "epoch": 0.66, "learning_rate": 5.5180737467488085e-06, "loss": 0.4649, "step": 5762 }, { "epoch": 0.66, "learning_rate": 5.514765009547181e-06, "loss": 0.4876, "step": 5763 }, { "epoch": 0.66, "learning_rate": 5.511456886922883e-06, "loss": 0.4452, "step": 5764 }, { "epoch": 0.66, "learning_rate": 5.508149379329204e-06, "loss": 0.4783, "step": 5765 }, { "epoch": 0.66, "learning_rate": 5.504842487219344e-06, "loss": 0.4413, "step": 5766 }, { "epoch": 0.66, "learning_rate": 5.5015362110464275e-06, "loss": 0.4431, "step": 5767 }, { "epoch": 0.66, "learning_rate": 5.4982305512634845e-06, "loss": 0.4764, "step": 5768 }, { "epoch": 0.66, "learning_rate": 5.4949255083234585e-06, "loss": 0.4596, "step": 5769 }, { "epoch": 0.66, "learning_rate": 5.491621082679224e-06, "loss": 0.4597, "step": 5770 }, { "epoch": 0.66, "learning_rate": 5.48831727478355e-06, "loss": 0.4672, "step": 5771 }, { "epoch": 0.66, "learning_rate": 5.4850140850891445e-06, "loss": 0.4401, "step": 5772 }, { "epoch": 0.66, "learning_rate": 5.481711514048609e-06, "loss": 0.4626, "step": 5773 }, { "epoch": 0.66, "learning_rate": 5.478409562114469e-06, "loss": 0.444, "step": 5774 }, { "epoch": 0.66, "learning_rate": 5.47510822973917e-06, "loss": 0.4472, "step": 5775 }, { "epoch": 0.66, "learning_rate": 5.4718075173750695e-06, "loss": 0.4574, "step": 5776 }, { "epoch": 0.66, "learning_rate": 5.4685074254744346e-06, "loss": 0.4639, "step": 5777 }, { "epoch": 0.66, "learning_rate": 5.465207954489454e-06, "loss": 0.4587, "step": 5778 }, { "epoch": 0.66, "learning_rate": 5.461909104872226e-06, "loss": 0.4665, "step": 5779 }, { "epoch": 0.66, "learning_rate": 5.458610877074773e-06, "loss": 0.4562, "step": 5780 }, { "epoch": 0.66, "learning_rate": 5.455313271549021e-06, "loss": 0.4441, "step": 5781 }, { "epoch": 0.66, "learning_rate": 5.452016288746813e-06, "loss": 0.4498, "step": 5782 }, { "epoch": 0.66, "learning_rate": 5.448719929119916e-06, "loss": 0.4597, "step": 5783 }, { "epoch": 0.66, "learning_rate": 5.445424193119997e-06, "loss": 0.4465, "step": 5784 }, { "epoch": 0.66, "learning_rate": 5.44212908119865e-06, "loss": 0.442, "step": 5785 }, { "epoch": 0.66, "learning_rate": 5.4388345938073824e-06, "loss": 0.441, "step": 5786 }, { "epoch": 0.66, "learning_rate": 5.435540731397606e-06, "loss": 0.4598, "step": 5787 }, { "epoch": 0.66, "learning_rate": 5.432247494420659e-06, "loss": 0.4435, "step": 5788 }, { "epoch": 0.66, "learning_rate": 5.4289548833277865e-06, "loss": 0.475, "step": 5789 }, { "epoch": 0.66, "learning_rate": 5.425662898570144e-06, "loss": 0.453, "step": 5790 }, { "epoch": 0.66, "learning_rate": 5.422371540598816e-06, "loss": 0.4684, "step": 5791 }, { "epoch": 0.66, "learning_rate": 5.419080809864785e-06, "loss": 0.4355, "step": 5792 }, { "epoch": 0.66, "learning_rate": 5.415790706818958e-06, "loss": 0.4451, "step": 5793 }, { "epoch": 0.66, "learning_rate": 5.412501231912153e-06, "loss": 0.472, "step": 5794 }, { "epoch": 0.66, "learning_rate": 5.409212385595098e-06, "loss": 0.4648, "step": 5795 }, { "epoch": 0.66, "learning_rate": 5.405924168318446e-06, "loss": 0.4761, "step": 5796 }, { "epoch": 0.66, "learning_rate": 5.4026365805327455e-06, "loss": 0.4499, "step": 5797 }, { "epoch": 0.66, "learning_rate": 5.399349622688479e-06, "loss": 0.4524, "step": 5798 }, { "epoch": 0.66, "learning_rate": 5.39606329523603e-06, "loss": 0.4547, "step": 5799 }, { "epoch": 0.66, "learning_rate": 5.392777598625694e-06, "loss": 0.4504, "step": 5800 }, { "epoch": 0.66, "learning_rate": 5.389492533307692e-06, "loss": 0.4597, "step": 5801 }, { "epoch": 0.66, "learning_rate": 5.386208099732144e-06, "loss": 0.461, "step": 5802 }, { "epoch": 0.66, "learning_rate": 5.382924298349095e-06, "loss": 0.4603, "step": 5803 }, { "epoch": 0.66, "learning_rate": 5.379641129608501e-06, "loss": 0.474, "step": 5804 }, { "epoch": 0.66, "learning_rate": 5.3763585939602244e-06, "loss": 0.4792, "step": 5805 }, { "epoch": 0.66, "learning_rate": 5.373076691854054e-06, "loss": 0.448, "step": 5806 }, { "epoch": 0.66, "learning_rate": 5.3697954237396764e-06, "loss": 0.4556, "step": 5807 }, { "epoch": 0.66, "learning_rate": 5.366514790066697e-06, "loss": 0.4481, "step": 5808 }, { "epoch": 0.66, "learning_rate": 5.363234791284644e-06, "loss": 0.4715, "step": 5809 }, { "epoch": 0.66, "learning_rate": 5.3599554278429415e-06, "loss": 0.4523, "step": 5810 }, { "epoch": 0.66, "learning_rate": 5.356676700190944e-06, "loss": 0.483, "step": 5811 }, { "epoch": 0.66, "learning_rate": 5.353398608777901e-06, "loss": 0.4732, "step": 5812 }, { "epoch": 0.66, "learning_rate": 5.35012115405299e-06, "loss": 0.4547, "step": 5813 }, { "epoch": 0.66, "learning_rate": 5.3468443364653e-06, "loss": 0.4648, "step": 5814 }, { "epoch": 0.66, "learning_rate": 5.343568156463821e-06, "loss": 0.4508, "step": 5815 }, { "epoch": 0.66, "learning_rate": 5.3402926144974625e-06, "loss": 0.4693, "step": 5816 }, { "epoch": 0.66, "learning_rate": 5.337017711015052e-06, "loss": 0.4573, "step": 5817 }, { "epoch": 0.66, "learning_rate": 5.333743446465318e-06, "loss": 0.4506, "step": 5818 }, { "epoch": 0.67, "learning_rate": 5.330469821296916e-06, "loss": 0.4474, "step": 5819 }, { "epoch": 0.67, "learning_rate": 5.327196835958402e-06, "loss": 0.4784, "step": 5820 }, { "epoch": 0.67, "learning_rate": 5.323924490898242e-06, "loss": 0.4562, "step": 5821 }, { "epoch": 0.67, "learning_rate": 5.320652786564826e-06, "loss": 0.4497, "step": 5822 }, { "epoch": 0.67, "learning_rate": 5.31738172340645e-06, "loss": 0.4454, "step": 5823 }, { "epoch": 0.67, "learning_rate": 5.314111301871325e-06, "loss": 0.4383, "step": 5824 }, { "epoch": 0.67, "learning_rate": 5.3108415224075725e-06, "loss": 0.4667, "step": 5825 }, { "epoch": 0.67, "learning_rate": 5.307572385463218e-06, "loss": 0.4501, "step": 5826 }, { "epoch": 0.67, "learning_rate": 5.304303891486213e-06, "loss": 0.4514, "step": 5827 }, { "epoch": 0.67, "learning_rate": 5.301036040924412e-06, "loss": 0.4677, "step": 5828 }, { "epoch": 0.67, "learning_rate": 5.297768834225581e-06, "loss": 0.4647, "step": 5829 }, { "epoch": 0.67, "learning_rate": 5.294502271837405e-06, "loss": 0.4455, "step": 5830 }, { "epoch": 0.67, "learning_rate": 5.2912363542074695e-06, "loss": 0.4584, "step": 5831 }, { "epoch": 0.67, "learning_rate": 5.287971081783283e-06, "loss": 0.4672, "step": 5832 }, { "epoch": 0.67, "learning_rate": 5.284706455012263e-06, "loss": 0.4464, "step": 5833 }, { "epoch": 0.67, "learning_rate": 5.281442474341729e-06, "loss": 0.4605, "step": 5834 }, { "epoch": 0.67, "learning_rate": 5.278179140218928e-06, "loss": 0.4518, "step": 5835 }, { "epoch": 0.67, "learning_rate": 5.274916453091001e-06, "loss": 0.4436, "step": 5836 }, { "epoch": 0.67, "learning_rate": 5.271654413405016e-06, "loss": 0.465, "step": 5837 }, { "epoch": 0.67, "learning_rate": 5.268393021607944e-06, "loss": 0.4715, "step": 5838 }, { "epoch": 0.67, "learning_rate": 5.2651322781466606e-06, "loss": 0.445, "step": 5839 }, { "epoch": 0.67, "learning_rate": 5.261872183467972e-06, "loss": 0.468, "step": 5840 }, { "epoch": 0.67, "learning_rate": 5.258612738018574e-06, "loss": 0.4424, "step": 5841 }, { "epoch": 0.67, "learning_rate": 5.255353942245089e-06, "loss": 0.4553, "step": 5842 }, { "epoch": 0.67, "learning_rate": 5.252095796594046e-06, "loss": 0.4456, "step": 5843 }, { "epoch": 0.67, "learning_rate": 5.2488383015118785e-06, "loss": 0.4466, "step": 5844 }, { "epoch": 0.67, "learning_rate": 5.2455814574449415e-06, "loss": 0.456, "step": 5845 }, { "epoch": 0.67, "learning_rate": 5.242325264839494e-06, "loss": 0.4612, "step": 5846 }, { "epoch": 0.67, "learning_rate": 5.239069724141701e-06, "loss": 0.4419, "step": 5847 }, { "epoch": 0.67, "learning_rate": 5.235814835797655e-06, "loss": 0.4759, "step": 5848 }, { "epoch": 0.67, "learning_rate": 5.232560600253336e-06, "loss": 0.4619, "step": 5849 }, { "epoch": 0.67, "learning_rate": 5.229307017954655e-06, "loss": 0.4547, "step": 5850 }, { "epoch": 0.67, "learning_rate": 5.226054089347428e-06, "loss": 0.4444, "step": 5851 }, { "epoch": 0.67, "learning_rate": 5.22280181487737e-06, "loss": 0.4596, "step": 5852 }, { "epoch": 0.67, "learning_rate": 5.219550194990124e-06, "loss": 0.4476, "step": 5853 }, { "epoch": 0.67, "learning_rate": 5.216299230131227e-06, "loss": 0.4702, "step": 5854 }, { "epoch": 0.67, "learning_rate": 5.21304892074614e-06, "loss": 0.4289, "step": 5855 }, { "epoch": 0.67, "learning_rate": 5.209799267280225e-06, "loss": 0.4721, "step": 5856 }, { "epoch": 0.67, "learning_rate": 5.206550270178754e-06, "loss": 0.4441, "step": 5857 }, { "epoch": 0.67, "learning_rate": 5.20330192988692e-06, "loss": 0.4478, "step": 5858 }, { "epoch": 0.67, "learning_rate": 5.2000542468498085e-06, "loss": 0.4388, "step": 5859 }, { "epoch": 0.67, "learning_rate": 5.19680722151243e-06, "loss": 0.456, "step": 5860 }, { "epoch": 0.67, "learning_rate": 5.1935608543197035e-06, "loss": 0.4623, "step": 5861 }, { "epoch": 0.67, "learning_rate": 5.1903151457164445e-06, "loss": 0.4772, "step": 5862 }, { "epoch": 0.67, "learning_rate": 5.187070096147397e-06, "loss": 0.4432, "step": 5863 }, { "epoch": 0.67, "learning_rate": 5.183825706057199e-06, "loss": 0.4853, "step": 5864 }, { "epoch": 0.67, "learning_rate": 5.180581975890404e-06, "loss": 0.4542, "step": 5865 }, { "epoch": 0.67, "learning_rate": 5.177338906091481e-06, "loss": 0.4507, "step": 5866 }, { "epoch": 0.67, "learning_rate": 5.1740964971047945e-06, "loss": 0.4507, "step": 5867 }, { "epoch": 0.67, "learning_rate": 5.1708547493746376e-06, "loss": 0.4551, "step": 5868 }, { "epoch": 0.67, "learning_rate": 5.16761366334519e-06, "loss": 0.4536, "step": 5869 }, { "epoch": 0.67, "learning_rate": 5.164373239460561e-06, "loss": 0.4742, "step": 5870 }, { "epoch": 0.67, "learning_rate": 5.161133478164764e-06, "loss": 0.4438, "step": 5871 }, { "epoch": 0.67, "learning_rate": 5.157894379901711e-06, "loss": 0.4696, "step": 5872 }, { "epoch": 0.67, "learning_rate": 5.154655945115233e-06, "loss": 0.4426, "step": 5873 }, { "epoch": 0.67, "learning_rate": 5.15141817424907e-06, "loss": 0.447, "step": 5874 }, { "epoch": 0.67, "learning_rate": 5.148181067746862e-06, "loss": 0.4607, "step": 5875 }, { "epoch": 0.67, "learning_rate": 5.144944626052178e-06, "loss": 0.4548, "step": 5876 }, { "epoch": 0.67, "learning_rate": 5.141708849608473e-06, "loss": 0.4623, "step": 5877 }, { "epoch": 0.67, "learning_rate": 5.138473738859118e-06, "loss": 0.4585, "step": 5878 }, { "epoch": 0.67, "learning_rate": 5.1352392942474005e-06, "loss": 0.4618, "step": 5879 }, { "epoch": 0.67, "learning_rate": 5.132005516216512e-06, "loss": 0.4381, "step": 5880 }, { "epoch": 0.67, "learning_rate": 5.128772405209556e-06, "loss": 0.4473, "step": 5881 }, { "epoch": 0.67, "learning_rate": 5.1255399616695345e-06, "loss": 0.4759, "step": 5882 }, { "epoch": 0.67, "learning_rate": 5.122308186039364e-06, "loss": 0.4472, "step": 5883 }, { "epoch": 0.67, "learning_rate": 5.119077078761875e-06, "loss": 0.453, "step": 5884 }, { "epoch": 0.67, "learning_rate": 5.115846640279798e-06, "loss": 0.4527, "step": 5885 }, { "epoch": 0.67, "learning_rate": 5.1126168710357735e-06, "loss": 0.4394, "step": 5886 }, { "epoch": 0.67, "learning_rate": 5.109387771472356e-06, "loss": 0.4605, "step": 5887 }, { "epoch": 0.67, "learning_rate": 5.106159342032e-06, "loss": 0.4662, "step": 5888 }, { "epoch": 0.67, "learning_rate": 5.102931583157074e-06, "loss": 0.4503, "step": 5889 }, { "epoch": 0.67, "learning_rate": 5.099704495289859e-06, "loss": 0.4692, "step": 5890 }, { "epoch": 0.67, "learning_rate": 5.096478078872528e-06, "loss": 0.4399, "step": 5891 }, { "epoch": 0.67, "learning_rate": 5.093252334347183e-06, "loss": 0.4462, "step": 5892 }, { "epoch": 0.67, "learning_rate": 5.09002726215581e-06, "loss": 0.4574, "step": 5893 }, { "epoch": 0.67, "learning_rate": 5.08680286274033e-06, "loss": 0.4606, "step": 5894 }, { "epoch": 0.67, "learning_rate": 5.083579136542548e-06, "loss": 0.4525, "step": 5895 }, { "epoch": 0.67, "learning_rate": 5.080356084004187e-06, "loss": 0.4595, "step": 5896 }, { "epoch": 0.67, "learning_rate": 5.0771337055668826e-06, "loss": 0.4541, "step": 5897 }, { "epoch": 0.67, "learning_rate": 5.073912001672165e-06, "loss": 0.4641, "step": 5898 }, { "epoch": 0.67, "learning_rate": 5.070690972761484e-06, "loss": 0.4504, "step": 5899 }, { "epoch": 0.67, "learning_rate": 5.067470619276196e-06, "loss": 0.4616, "step": 5900 }, { "epoch": 0.67, "learning_rate": 5.064250941657555e-06, "loss": 0.4527, "step": 5901 }, { "epoch": 0.67, "learning_rate": 5.061031940346734e-06, "loss": 0.4591, "step": 5902 }, { "epoch": 0.67, "learning_rate": 5.057813615784806e-06, "loss": 0.4393, "step": 5903 }, { "epoch": 0.67, "learning_rate": 5.054595968412748e-06, "loss": 0.4637, "step": 5904 }, { "epoch": 0.67, "learning_rate": 5.051378998671459e-06, "loss": 0.4544, "step": 5905 }, { "epoch": 0.67, "learning_rate": 5.048162707001727e-06, "loss": 0.4612, "step": 5906 }, { "epoch": 0.68, "learning_rate": 5.044947093844259e-06, "loss": 0.4416, "step": 5907 }, { "epoch": 0.68, "learning_rate": 5.0417321596396715e-06, "loss": 0.4594, "step": 5908 }, { "epoch": 0.68, "learning_rate": 5.038517904828473e-06, "loss": 0.4519, "step": 5909 }, { "epoch": 0.68, "learning_rate": 5.035304329851096e-06, "loss": 0.4565, "step": 5910 }, { "epoch": 0.68, "learning_rate": 5.032091435147867e-06, "loss": 0.4487, "step": 5911 }, { "epoch": 0.68, "learning_rate": 5.028879221159025e-06, "loss": 0.4597, "step": 5912 }, { "epoch": 0.68, "learning_rate": 5.025667688324718e-06, "loss": 0.4687, "step": 5913 }, { "epoch": 0.68, "learning_rate": 5.02245683708499e-06, "loss": 0.4769, "step": 5914 }, { "epoch": 0.68, "learning_rate": 5.0192466678798116e-06, "loss": 0.4546, "step": 5915 }, { "epoch": 0.68, "learning_rate": 5.016037181149036e-06, "loss": 0.4698, "step": 5916 }, { "epoch": 0.68, "learning_rate": 5.012828377332438e-06, "loss": 0.447, "step": 5917 }, { "epoch": 0.68, "learning_rate": 5.009620256869703e-06, "loss": 0.4466, "step": 5918 }, { "epoch": 0.68, "learning_rate": 5.0064128202004025e-06, "loss": 0.4612, "step": 5919 }, { "epoch": 0.68, "learning_rate": 5.003206067764039e-06, "loss": 0.4515, "step": 5920 }, { "epoch": 0.68, "learning_rate": 5.000000000000003e-06, "loss": 0.4684, "step": 5921 }, { "epoch": 0.68, "learning_rate": 4.996794617347593e-06, "loss": 0.4616, "step": 5922 }, { "epoch": 0.68, "learning_rate": 4.993589920246028e-06, "loss": 0.4691, "step": 5923 }, { "epoch": 0.68, "learning_rate": 4.9903859091344175e-06, "loss": 0.46, "step": 5924 }, { "epoch": 0.68, "learning_rate": 4.987182584451778e-06, "loss": 0.4516, "step": 5925 }, { "epoch": 0.68, "learning_rate": 4.983979946637043e-06, "loss": 0.4487, "step": 5926 }, { "epoch": 0.68, "learning_rate": 4.980777996129043e-06, "loss": 0.4312, "step": 5927 }, { "epoch": 0.68, "learning_rate": 4.977576733366521e-06, "loss": 0.4613, "step": 5928 }, { "epoch": 0.68, "learning_rate": 4.974376158788119e-06, "loss": 0.4487, "step": 5929 }, { "epoch": 0.68, "learning_rate": 4.971176272832382e-06, "loss": 0.4573, "step": 5930 }, { "epoch": 0.68, "learning_rate": 4.967977075937774e-06, "loss": 0.4519, "step": 5931 }, { "epoch": 0.68, "learning_rate": 4.964778568542649e-06, "loss": 0.4419, "step": 5932 }, { "epoch": 0.68, "learning_rate": 4.9615807510852795e-06, "loss": 0.448, "step": 5933 }, { "epoch": 0.68, "learning_rate": 4.958383624003836e-06, "loss": 0.4687, "step": 5934 }, { "epoch": 0.68, "learning_rate": 4.955187187736393e-06, "loss": 0.4446, "step": 5935 }, { "epoch": 0.68, "learning_rate": 4.951991442720937e-06, "loss": 0.4657, "step": 5936 }, { "epoch": 0.68, "learning_rate": 4.948796389395355e-06, "loss": 0.4441, "step": 5937 }, { "epoch": 0.68, "learning_rate": 4.945602028197447e-06, "loss": 0.4799, "step": 5938 }, { "epoch": 0.68, "learning_rate": 4.942408359564906e-06, "loss": 0.4605, "step": 5939 }, { "epoch": 0.68, "learning_rate": 4.939215383935331e-06, "loss": 0.4591, "step": 5940 }, { "epoch": 0.68, "learning_rate": 4.936023101746242e-06, "loss": 0.4457, "step": 5941 }, { "epoch": 0.68, "learning_rate": 4.932831513435045e-06, "loss": 0.4516, "step": 5942 }, { "epoch": 0.68, "learning_rate": 4.929640619439059e-06, "loss": 0.4394, "step": 5943 }, { "epoch": 0.68, "learning_rate": 4.926450420195513e-06, "loss": 0.4495, "step": 5944 }, { "epoch": 0.68, "learning_rate": 4.92326091614153e-06, "loss": 0.4513, "step": 5945 }, { "epoch": 0.68, "learning_rate": 4.920072107714145e-06, "loss": 0.4674, "step": 5946 }, { "epoch": 0.68, "learning_rate": 4.916883995350299e-06, "loss": 0.4625, "step": 5947 }, { "epoch": 0.68, "learning_rate": 4.913696579486829e-06, "loss": 0.4644, "step": 5948 }, { "epoch": 0.68, "learning_rate": 4.91050986056049e-06, "loss": 0.4591, "step": 5949 }, { "epoch": 0.68, "learning_rate": 4.907323839007925e-06, "loss": 0.4544, "step": 5950 }, { "epoch": 0.68, "learning_rate": 4.904138515265696e-06, "loss": 0.4634, "step": 5951 }, { "epoch": 0.68, "learning_rate": 4.900953889770264e-06, "loss": 0.4425, "step": 5952 }, { "epoch": 0.68, "learning_rate": 4.897769962957986e-06, "loss": 0.4416, "step": 5953 }, { "epoch": 0.68, "learning_rate": 4.89458673526514e-06, "loss": 0.4747, "step": 5954 }, { "epoch": 0.68, "learning_rate": 4.891404207127892e-06, "loss": 0.4554, "step": 5955 }, { "epoch": 0.68, "learning_rate": 4.888222378982323e-06, "loss": 0.4564, "step": 5956 }, { "epoch": 0.68, "learning_rate": 4.885041251264419e-06, "loss": 0.4421, "step": 5957 }, { "epoch": 0.68, "learning_rate": 4.881860824410056e-06, "loss": 0.4374, "step": 5958 }, { "epoch": 0.68, "learning_rate": 4.8786810988550326e-06, "loss": 0.4528, "step": 5959 }, { "epoch": 0.68, "learning_rate": 4.875502075035039e-06, "loss": 0.474, "step": 5960 }, { "epoch": 0.68, "learning_rate": 4.872323753385667e-06, "loss": 0.4414, "step": 5961 }, { "epoch": 0.68, "learning_rate": 4.869146134342426e-06, "loss": 0.4653, "step": 5962 }, { "epoch": 0.68, "learning_rate": 4.8659692183407135e-06, "loss": 0.4524, "step": 5963 }, { "epoch": 0.68, "learning_rate": 4.862793005815841e-06, "loss": 0.4981, "step": 5964 }, { "epoch": 0.68, "learning_rate": 4.859617497203024e-06, "loss": 0.4381, "step": 5965 }, { "epoch": 0.68, "learning_rate": 4.856442692937372e-06, "loss": 0.4612, "step": 5966 }, { "epoch": 0.68, "learning_rate": 4.85326859345391e-06, "loss": 0.4269, "step": 5967 }, { "epoch": 0.68, "learning_rate": 4.850095199187559e-06, "loss": 0.4602, "step": 5968 }, { "epoch": 0.68, "learning_rate": 4.846922510573139e-06, "loss": 0.4351, "step": 5969 }, { "epoch": 0.68, "learning_rate": 4.843750528045387e-06, "loss": 0.4577, "step": 5970 }, { "epoch": 0.68, "learning_rate": 4.8405792520389275e-06, "loss": 0.4465, "step": 5971 }, { "epoch": 0.68, "learning_rate": 4.837408682988305e-06, "loss": 0.4765, "step": 5972 }, { "epoch": 0.68, "learning_rate": 4.83423882132795e-06, "loss": 0.4499, "step": 5973 }, { "epoch": 0.68, "learning_rate": 4.831069667492209e-06, "loss": 0.4669, "step": 5974 }, { "epoch": 0.68, "learning_rate": 4.8279012219153284e-06, "loss": 0.479, "step": 5975 }, { "epoch": 0.68, "learning_rate": 4.8247334850314495e-06, "loss": 0.4517, "step": 5976 }, { "epoch": 0.68, "learning_rate": 4.821566457274632e-06, "loss": 0.4491, "step": 5977 }, { "epoch": 0.68, "learning_rate": 4.818400139078824e-06, "loss": 0.4552, "step": 5978 }, { "epoch": 0.68, "learning_rate": 4.815234530877879e-06, "loss": 0.4508, "step": 5979 }, { "epoch": 0.68, "learning_rate": 4.812069633105563e-06, "loss": 0.4679, "step": 5980 }, { "epoch": 0.68, "learning_rate": 4.808905446195532e-06, "loss": 0.4566, "step": 5981 }, { "epoch": 0.68, "learning_rate": 4.80574197058135e-06, "loss": 0.4555, "step": 5982 }, { "epoch": 0.68, "learning_rate": 4.802579206696486e-06, "loss": 0.4574, "step": 5983 }, { "epoch": 0.68, "learning_rate": 4.7994171549743085e-06, "loss": 0.4367, "step": 5984 }, { "epoch": 0.68, "learning_rate": 4.796255815848094e-06, "loss": 0.4542, "step": 5985 }, { "epoch": 0.68, "learning_rate": 4.7930951897510126e-06, "loss": 0.4746, "step": 5986 }, { "epoch": 0.68, "learning_rate": 4.7899352771161355e-06, "loss": 0.4405, "step": 5987 }, { "epoch": 0.68, "learning_rate": 4.786776078376451e-06, "loss": 0.4694, "step": 5988 }, { "epoch": 0.68, "learning_rate": 4.783617593964831e-06, "loss": 0.466, "step": 5989 }, { "epoch": 0.68, "learning_rate": 4.7804598243140664e-06, "loss": 0.4495, "step": 5990 }, { "epoch": 0.68, "learning_rate": 4.777302769856838e-06, "loss": 0.4656, "step": 5991 }, { "epoch": 0.68, "learning_rate": 4.7741464310257305e-06, "loss": 0.4563, "step": 5992 }, { "epoch": 0.68, "learning_rate": 4.770990808253234e-06, "loss": 0.4475, "step": 5993 }, { "epoch": 0.69, "learning_rate": 4.767835901971745e-06, "loss": 0.4664, "step": 5994 }, { "epoch": 0.69, "learning_rate": 4.764681712613547e-06, "loss": 0.4534, "step": 5995 }, { "epoch": 0.69, "learning_rate": 4.761528240610842e-06, "loss": 0.4654, "step": 5996 }, { "epoch": 0.69, "learning_rate": 4.758375486395721e-06, "loss": 0.4525, "step": 5997 }, { "epoch": 0.69, "learning_rate": 4.755223450400186e-06, "loss": 0.4443, "step": 5998 }, { "epoch": 0.69, "learning_rate": 4.752072133056135e-06, "loss": 0.456, "step": 5999 }, { "epoch": 0.69, "learning_rate": 4.748921534795365e-06, "loss": 0.459, "step": 6000 }, { "epoch": 0.69, "learning_rate": 4.745771656049584e-06, "loss": 0.4575, "step": 6001 }, { "epoch": 0.69, "learning_rate": 4.742622497250389e-06, "loss": 0.4503, "step": 6002 }, { "epoch": 0.69, "learning_rate": 4.739474058829288e-06, "loss": 0.451, "step": 6003 }, { "epoch": 0.69, "learning_rate": 4.736326341217694e-06, "loss": 0.4712, "step": 6004 }, { "epoch": 0.69, "learning_rate": 4.7331793448469045e-06, "loss": 0.4605, "step": 6005 }, { "epoch": 0.69, "learning_rate": 4.730033070148135e-06, "loss": 0.4639, "step": 6006 }, { "epoch": 0.69, "learning_rate": 4.726887517552495e-06, "loss": 0.4432, "step": 6007 }, { "epoch": 0.69, "learning_rate": 4.723742687490988e-06, "loss": 0.4674, "step": 6008 }, { "epoch": 0.69, "learning_rate": 4.7205985803945375e-06, "loss": 0.4835, "step": 6009 }, { "epoch": 0.69, "learning_rate": 4.717455196693945e-06, "loss": 0.4496, "step": 6010 }, { "epoch": 0.69, "learning_rate": 4.7143125368199335e-06, "loss": 0.4478, "step": 6011 }, { "epoch": 0.69, "learning_rate": 4.71117060120311e-06, "loss": 0.4502, "step": 6012 }, { "epoch": 0.69, "learning_rate": 4.708029390273994e-06, "loss": 0.4507, "step": 6013 }, { "epoch": 0.69, "learning_rate": 4.704888904463003e-06, "loss": 0.4554, "step": 6014 }, { "epoch": 0.69, "learning_rate": 4.701749144200449e-06, "loss": 0.4624, "step": 6015 }, { "epoch": 0.69, "learning_rate": 4.698610109916556e-06, "loss": 0.4803, "step": 6016 }, { "epoch": 0.69, "learning_rate": 4.695471802041437e-06, "loss": 0.4823, "step": 6017 }, { "epoch": 0.69, "learning_rate": 4.692334221005108e-06, "loss": 0.4486, "step": 6018 }, { "epoch": 0.69, "learning_rate": 4.689197367237494e-06, "loss": 0.4389, "step": 6019 }, { "epoch": 0.69, "learning_rate": 4.686061241168406e-06, "loss": 0.4453, "step": 6020 }, { "epoch": 0.69, "learning_rate": 4.6829258432275685e-06, "loss": 0.4557, "step": 6021 }, { "epoch": 0.69, "learning_rate": 4.679791173844604e-06, "loss": 0.4706, "step": 6022 }, { "epoch": 0.69, "learning_rate": 4.676657233449025e-06, "loss": 0.4546, "step": 6023 }, { "epoch": 0.69, "learning_rate": 4.673524022470259e-06, "loss": 0.4494, "step": 6024 }, { "epoch": 0.69, "learning_rate": 4.67039154133762e-06, "loss": 0.4828, "step": 6025 }, { "epoch": 0.69, "learning_rate": 4.667259790480327e-06, "loss": 0.459, "step": 6026 }, { "epoch": 0.69, "learning_rate": 4.664128770327506e-06, "loss": 0.4288, "step": 6027 }, { "epoch": 0.69, "learning_rate": 4.66099848130817e-06, "loss": 0.4452, "step": 6028 }, { "epoch": 0.69, "learning_rate": 4.657868923851244e-06, "loss": 0.4451, "step": 6029 }, { "epoch": 0.69, "learning_rate": 4.6547400983855415e-06, "loss": 0.4561, "step": 6030 }, { "epoch": 0.69, "learning_rate": 4.651612005339786e-06, "loss": 0.461, "step": 6031 }, { "epoch": 0.69, "learning_rate": 4.648484645142597e-06, "loss": 0.4506, "step": 6032 }, { "epoch": 0.69, "learning_rate": 4.645358018222486e-06, "loss": 0.4559, "step": 6033 }, { "epoch": 0.69, "learning_rate": 4.642232125007881e-06, "loss": 0.4586, "step": 6034 }, { "epoch": 0.69, "learning_rate": 4.639106965927093e-06, "loss": 0.4874, "step": 6035 }, { "epoch": 0.69, "learning_rate": 4.635982541408334e-06, "loss": 0.454, "step": 6036 }, { "epoch": 0.69, "learning_rate": 4.632858851879729e-06, "loss": 0.4698, "step": 6037 }, { "epoch": 0.69, "learning_rate": 4.629735897769289e-06, "loss": 0.4706, "step": 6038 }, { "epoch": 0.69, "learning_rate": 4.626613679504924e-06, "loss": 0.4483, "step": 6039 }, { "epoch": 0.69, "learning_rate": 4.623492197514453e-06, "loss": 0.476, "step": 6040 }, { "epoch": 0.69, "learning_rate": 4.620371452225587e-06, "loss": 0.464, "step": 6041 }, { "epoch": 0.69, "learning_rate": 4.6172514440659435e-06, "loss": 0.4384, "step": 6042 }, { "epoch": 0.69, "learning_rate": 4.614132173463027e-06, "loss": 0.4674, "step": 6043 }, { "epoch": 0.69, "learning_rate": 4.611013640844245e-06, "loss": 0.4489, "step": 6044 }, { "epoch": 0.69, "learning_rate": 4.607895846636914e-06, "loss": 0.4501, "step": 6045 }, { "epoch": 0.69, "learning_rate": 4.604778791268233e-06, "loss": 0.4437, "step": 6046 }, { "epoch": 0.69, "learning_rate": 4.601662475165316e-06, "loss": 0.4566, "step": 6047 }, { "epoch": 0.69, "learning_rate": 4.598546898755164e-06, "loss": 0.4739, "step": 6048 }, { "epoch": 0.69, "learning_rate": 4.595432062464678e-06, "loss": 0.454, "step": 6049 }, { "epoch": 0.69, "learning_rate": 4.592317966720661e-06, "loss": 0.432, "step": 6050 }, { "epoch": 0.69, "learning_rate": 4.589204611949819e-06, "loss": 0.4652, "step": 6051 }, { "epoch": 0.69, "learning_rate": 4.5860919985787454e-06, "loss": 0.4672, "step": 6052 }, { "epoch": 0.69, "learning_rate": 4.582980127033943e-06, "loss": 0.4432, "step": 6053 }, { "epoch": 0.69, "learning_rate": 4.5798689977418e-06, "loss": 0.451, "step": 6054 }, { "epoch": 0.69, "learning_rate": 4.576758611128619e-06, "loss": 0.4519, "step": 6055 }, { "epoch": 0.69, "learning_rate": 4.573648967620589e-06, "loss": 0.4571, "step": 6056 }, { "epoch": 0.69, "learning_rate": 4.570540067643796e-06, "loss": 0.4493, "step": 6057 }, { "epoch": 0.69, "learning_rate": 4.567431911624236e-06, "loss": 0.481, "step": 6058 }, { "epoch": 0.69, "learning_rate": 4.56432449998779e-06, "loss": 0.4614, "step": 6059 }, { "epoch": 0.69, "learning_rate": 4.5612178331602445e-06, "loss": 0.4561, "step": 6060 }, { "epoch": 0.69, "learning_rate": 4.558111911567287e-06, "loss": 0.4479, "step": 6061 }, { "epoch": 0.69, "learning_rate": 4.55500673563449e-06, "loss": 0.4753, "step": 6062 }, { "epoch": 0.69, "learning_rate": 4.55190230578734e-06, "loss": 0.4457, "step": 6063 }, { "epoch": 0.69, "learning_rate": 4.54879862245121e-06, "loss": 0.4726, "step": 6064 }, { "epoch": 0.69, "learning_rate": 4.545695686051369e-06, "loss": 0.4457, "step": 6065 }, { "epoch": 0.69, "learning_rate": 4.542593497012996e-06, "loss": 0.4729, "step": 6066 }, { "epoch": 0.69, "learning_rate": 4.539492055761153e-06, "loss": 0.4398, "step": 6067 }, { "epoch": 0.69, "learning_rate": 4.536391362720816e-06, "loss": 0.4609, "step": 6068 }, { "epoch": 0.69, "learning_rate": 4.533291418316837e-06, "loss": 0.4608, "step": 6069 }, { "epoch": 0.69, "learning_rate": 4.530192222973987e-06, "loss": 0.443, "step": 6070 }, { "epoch": 0.69, "learning_rate": 4.527093777116925e-06, "loss": 0.4677, "step": 6071 }, { "epoch": 0.69, "learning_rate": 4.523996081170201e-06, "loss": 0.4473, "step": 6072 }, { "epoch": 0.69, "learning_rate": 4.520899135558276e-06, "loss": 0.455, "step": 6073 }, { "epoch": 0.69, "learning_rate": 4.5178029407054965e-06, "loss": 0.4453, "step": 6074 }, { "epoch": 0.69, "learning_rate": 4.514707497036107e-06, "loss": 0.4705, "step": 6075 }, { "epoch": 0.69, "learning_rate": 4.511612804974259e-06, "loss": 0.4396, "step": 6076 }, { "epoch": 0.69, "learning_rate": 4.508518864943989e-06, "loss": 0.4703, "step": 6077 }, { "epoch": 0.69, "learning_rate": 4.505425677369238e-06, "loss": 0.4372, "step": 6078 }, { "epoch": 0.69, "learning_rate": 4.5023332426738445e-06, "loss": 0.4476, "step": 6079 }, { "epoch": 0.69, "learning_rate": 4.4992415612815355e-06, "loss": 0.4527, "step": 6080 }, { "epoch": 0.69, "learning_rate": 4.496150633615947e-06, "loss": 0.4683, "step": 6081 }, { "epoch": 0.7, "learning_rate": 4.4930604601006025e-06, "loss": 0.4637, "step": 6082 }, { "epoch": 0.7, "learning_rate": 4.489971041158919e-06, "loss": 0.4505, "step": 6083 }, { "epoch": 0.7, "learning_rate": 4.486882377214226e-06, "loss": 0.4505, "step": 6084 }, { "epoch": 0.7, "learning_rate": 4.483794468689728e-06, "loss": 0.4463, "step": 6085 }, { "epoch": 0.7, "learning_rate": 4.480707316008549e-06, "loss": 0.4404, "step": 6086 }, { "epoch": 0.7, "learning_rate": 4.477620919593688e-06, "loss": 0.4671, "step": 6087 }, { "epoch": 0.7, "learning_rate": 4.474535279868055e-06, "loss": 0.449, "step": 6088 }, { "epoch": 0.7, "learning_rate": 4.4714503972544545e-06, "loss": 0.4668, "step": 6089 }, { "epoch": 0.7, "learning_rate": 4.4683662721755805e-06, "loss": 0.4563, "step": 6090 }, { "epoch": 0.7, "learning_rate": 4.465282905054025e-06, "loss": 0.4432, "step": 6091 }, { "epoch": 0.7, "learning_rate": 4.462200296312284e-06, "loss": 0.4485, "step": 6092 }, { "epoch": 0.7, "learning_rate": 4.459118446372736e-06, "loss": 0.4552, "step": 6093 }, { "epoch": 0.7, "learning_rate": 4.45603735565767e-06, "loss": 0.4486, "step": 6094 }, { "epoch": 0.7, "learning_rate": 4.4529570245892625e-06, "loss": 0.4531, "step": 6095 }, { "epoch": 0.7, "learning_rate": 4.449877453589584e-06, "loss": 0.4359, "step": 6096 }, { "epoch": 0.7, "learning_rate": 4.446798643080608e-06, "loss": 0.4864, "step": 6097 }, { "epoch": 0.7, "learning_rate": 4.443720593484198e-06, "loss": 0.4502, "step": 6098 }, { "epoch": 0.7, "learning_rate": 4.440643305222121e-06, "loss": 0.4621, "step": 6099 }, { "epoch": 0.7, "learning_rate": 4.43756677871603e-06, "loss": 0.4472, "step": 6100 }, { "epoch": 0.7, "learning_rate": 4.4344910143874755e-06, "loss": 0.4595, "step": 6101 }, { "epoch": 0.7, "learning_rate": 4.431416012657912e-06, "loss": 0.4382, "step": 6102 }, { "epoch": 0.7, "learning_rate": 4.42834177394868e-06, "loss": 0.4416, "step": 6103 }, { "epoch": 0.7, "learning_rate": 4.425268298681015e-06, "loss": 0.4432, "step": 6104 }, { "epoch": 0.7, "learning_rate": 4.422195587276058e-06, "loss": 0.4588, "step": 6105 }, { "epoch": 0.7, "learning_rate": 4.419123640154834e-06, "loss": 0.4484, "step": 6106 }, { "epoch": 0.7, "learning_rate": 4.416052457738271e-06, "loss": 0.4875, "step": 6107 }, { "epoch": 0.7, "learning_rate": 4.412982040447193e-06, "loss": 0.4492, "step": 6108 }, { "epoch": 0.7, "learning_rate": 4.409912388702308e-06, "loss": 0.4476, "step": 6109 }, { "epoch": 0.7, "learning_rate": 4.406843502924235e-06, "loss": 0.4601, "step": 6110 }, { "epoch": 0.7, "learning_rate": 4.403775383533472e-06, "loss": 0.4618, "step": 6111 }, { "epoch": 0.7, "learning_rate": 4.400708030950428e-06, "loss": 0.4439, "step": 6112 }, { "epoch": 0.7, "learning_rate": 4.397641445595393e-06, "loss": 0.4651, "step": 6113 }, { "epoch": 0.7, "learning_rate": 4.394575627888558e-06, "loss": 0.4394, "step": 6114 }, { "epoch": 0.7, "learning_rate": 4.391510578250011e-06, "loss": 0.4715, "step": 6115 }, { "epoch": 0.7, "learning_rate": 4.388446297099728e-06, "loss": 0.4585, "step": 6116 }, { "epoch": 0.7, "learning_rate": 4.385382784857587e-06, "loss": 0.4418, "step": 6117 }, { "epoch": 0.7, "learning_rate": 4.382320041943361e-06, "loss": 0.4464, "step": 6118 }, { "epoch": 0.7, "learning_rate": 4.379258068776706e-06, "loss": 0.4421, "step": 6119 }, { "epoch": 0.7, "learning_rate": 4.3761968657771905e-06, "loss": 0.4487, "step": 6120 }, { "epoch": 0.7, "learning_rate": 4.3731364333642615e-06, "loss": 0.4634, "step": 6121 }, { "epoch": 0.7, "learning_rate": 4.370076771957264e-06, "loss": 0.4363, "step": 6122 }, { "epoch": 0.7, "learning_rate": 4.367017881975446e-06, "loss": 0.4684, "step": 6123 }, { "epoch": 0.7, "learning_rate": 4.363959763837938e-06, "loss": 0.4628, "step": 6124 }, { "epoch": 0.7, "learning_rate": 4.360902417963777e-06, "loss": 0.4726, "step": 6125 }, { "epoch": 0.7, "learning_rate": 4.357845844771881e-06, "loss": 0.4525, "step": 6126 }, { "epoch": 0.7, "learning_rate": 4.354790044681072e-06, "loss": 0.4496, "step": 6127 }, { "epoch": 0.7, "learning_rate": 4.351735018110066e-06, "loss": 0.4513, "step": 6128 }, { "epoch": 0.7, "learning_rate": 4.348680765477463e-06, "loss": 0.4627, "step": 6129 }, { "epoch": 0.7, "learning_rate": 4.3456272872017725e-06, "loss": 0.4446, "step": 6130 }, { "epoch": 0.7, "learning_rate": 4.342574583701382e-06, "loss": 0.4567, "step": 6131 }, { "epoch": 0.7, "learning_rate": 4.33952265539458e-06, "loss": 0.4456, "step": 6132 }, { "epoch": 0.7, "learning_rate": 4.336471502699554e-06, "loss": 0.4527, "step": 6133 }, { "epoch": 0.7, "learning_rate": 4.333421126034374e-06, "loss": 0.4668, "step": 6134 }, { "epoch": 0.7, "learning_rate": 4.330371525817012e-06, "loss": 0.4575, "step": 6135 }, { "epoch": 0.7, "learning_rate": 4.327322702465335e-06, "loss": 0.4421, "step": 6136 }, { "epoch": 0.7, "learning_rate": 4.324274656397095e-06, "loss": 0.4728, "step": 6137 }, { "epoch": 0.7, "learning_rate": 4.321227388029947e-06, "loss": 0.4593, "step": 6138 }, { "epoch": 0.7, "learning_rate": 4.318180897781432e-06, "loss": 0.4651, "step": 6139 }, { "epoch": 0.7, "learning_rate": 4.315135186068984e-06, "loss": 0.4454, "step": 6140 }, { "epoch": 0.7, "learning_rate": 4.312090253309941e-06, "loss": 0.4575, "step": 6141 }, { "epoch": 0.7, "learning_rate": 4.309046099921518e-06, "loss": 0.4456, "step": 6142 }, { "epoch": 0.7, "learning_rate": 4.306002726320839e-06, "loss": 0.4633, "step": 6143 }, { "epoch": 0.7, "learning_rate": 4.302960132924909e-06, "loss": 0.4532, "step": 6144 }, { "epoch": 0.7, "learning_rate": 4.299918320150634e-06, "loss": 0.4513, "step": 6145 }, { "epoch": 0.7, "learning_rate": 4.296877288414815e-06, "loss": 0.4538, "step": 6146 }, { "epoch": 0.7, "learning_rate": 4.2938370381341355e-06, "loss": 0.445, "step": 6147 }, { "epoch": 0.7, "learning_rate": 4.290797569725175e-06, "loss": 0.4534, "step": 6148 }, { "epoch": 0.7, "learning_rate": 4.287758883604415e-06, "loss": 0.4542, "step": 6149 }, { "epoch": 0.7, "learning_rate": 4.284720980188216e-06, "loss": 0.4479, "step": 6150 }, { "epoch": 0.7, "learning_rate": 4.281683859892849e-06, "loss": 0.4849, "step": 6151 }, { "epoch": 0.7, "learning_rate": 4.278647523134459e-06, "loss": 0.4355, "step": 6152 }, { "epoch": 0.7, "learning_rate": 4.275611970329092e-06, "loss": 0.4748, "step": 6153 }, { "epoch": 0.7, "learning_rate": 4.272577201892688e-06, "loss": 0.4573, "step": 6154 }, { "epoch": 0.7, "learning_rate": 4.269543218241079e-06, "loss": 0.4502, "step": 6155 }, { "epoch": 0.7, "learning_rate": 4.266510019789993e-06, "loss": 0.464, "step": 6156 }, { "epoch": 0.7, "learning_rate": 4.26347760695504e-06, "loss": 0.4589, "step": 6157 }, { "epoch": 0.7, "learning_rate": 4.260445980151725e-06, "loss": 0.4541, "step": 6158 }, { "epoch": 0.7, "learning_rate": 4.257415139795458e-06, "loss": 0.4498, "step": 6159 }, { "epoch": 0.7, "learning_rate": 4.2543850863015266e-06, "loss": 0.451, "step": 6160 }, { "epoch": 0.7, "learning_rate": 4.2513558200851115e-06, "loss": 0.4428, "step": 6161 }, { "epoch": 0.7, "learning_rate": 4.248327341561298e-06, "loss": 0.4627, "step": 6162 }, { "epoch": 0.7, "learning_rate": 4.245299651145048e-06, "loss": 0.4586, "step": 6163 }, { "epoch": 0.7, "learning_rate": 4.242272749251228e-06, "loss": 0.4486, "step": 6164 }, { "epoch": 0.7, "learning_rate": 4.239246636294591e-06, "loss": 0.4699, "step": 6165 }, { "epoch": 0.7, "learning_rate": 4.236221312689777e-06, "loss": 0.4538, "step": 6166 }, { "epoch": 0.7, "learning_rate": 4.2331967788513295e-06, "loss": 0.4742, "step": 6167 }, { "epoch": 0.7, "learning_rate": 4.230173035193671e-06, "loss": 0.4524, "step": 6168 }, { "epoch": 0.71, "learning_rate": 4.227150082131128e-06, "loss": 0.4548, "step": 6169 }, { "epoch": 0.71, "learning_rate": 4.2241279200779105e-06, "loss": 0.4454, "step": 6170 }, { "epoch": 0.71, "learning_rate": 4.221106549448116e-06, "loss": 0.4473, "step": 6171 }, { "epoch": 0.71, "learning_rate": 4.21808597065575e-06, "loss": 0.4565, "step": 6172 }, { "epoch": 0.71, "learning_rate": 4.215066184114689e-06, "loss": 0.4502, "step": 6173 }, { "epoch": 0.71, "learning_rate": 4.212047190238716e-06, "loss": 0.4569, "step": 6174 }, { "epoch": 0.71, "learning_rate": 4.209028989441505e-06, "loss": 0.4568, "step": 6175 }, { "epoch": 0.71, "learning_rate": 4.2060115821366085e-06, "loss": 0.4514, "step": 6176 }, { "epoch": 0.71, "learning_rate": 4.202994968737487e-06, "loss": 0.4507, "step": 6177 }, { "epoch": 0.71, "learning_rate": 4.199979149657481e-06, "loss": 0.4546, "step": 6178 }, { "epoch": 0.71, "learning_rate": 4.196964125309818e-06, "loss": 0.4484, "step": 6179 }, { "epoch": 0.71, "learning_rate": 4.1939498961076345e-06, "loss": 0.451, "step": 6180 }, { "epoch": 0.71, "learning_rate": 4.190936462463937e-06, "loss": 0.4628, "step": 6181 }, { "epoch": 0.71, "learning_rate": 4.187923824791642e-06, "loss": 0.4572, "step": 6182 }, { "epoch": 0.71, "learning_rate": 4.184911983503541e-06, "loss": 0.483, "step": 6183 }, { "epoch": 0.71, "learning_rate": 4.1819009390123276e-06, "loss": 0.4448, "step": 6184 }, { "epoch": 0.71, "learning_rate": 4.178890691730585e-06, "loss": 0.4624, "step": 6185 }, { "epoch": 0.71, "learning_rate": 4.17588124207078e-06, "loss": 0.4336, "step": 6186 }, { "epoch": 0.71, "learning_rate": 4.172872590445273e-06, "loss": 0.4823, "step": 6187 }, { "epoch": 0.71, "learning_rate": 4.169864737266321e-06, "loss": 0.4495, "step": 6188 }, { "epoch": 0.71, "learning_rate": 4.166857682946061e-06, "loss": 0.4592, "step": 6189 }, { "epoch": 0.71, "learning_rate": 4.163851427896534e-06, "loss": 0.4319, "step": 6190 }, { "epoch": 0.71, "learning_rate": 4.160845972529656e-06, "loss": 0.4667, "step": 6191 }, { "epoch": 0.71, "learning_rate": 4.157841317257245e-06, "loss": 0.4676, "step": 6192 }, { "epoch": 0.71, "learning_rate": 4.154837462491012e-06, "loss": 0.4332, "step": 6193 }, { "epoch": 0.71, "learning_rate": 4.151834408642542e-06, "loss": 0.4331, "step": 6194 }, { "epoch": 0.71, "learning_rate": 4.148832156123329e-06, "loss": 0.4461, "step": 6195 }, { "epoch": 0.71, "learning_rate": 4.145830705344746e-06, "loss": 0.4527, "step": 6196 }, { "epoch": 0.71, "learning_rate": 4.142830056718052e-06, "loss": 0.4627, "step": 6197 }, { "epoch": 0.71, "learning_rate": 4.139830210654413e-06, "loss": 0.4456, "step": 6198 }, { "epoch": 0.71, "learning_rate": 4.136831167564867e-06, "loss": 0.4483, "step": 6199 }, { "epoch": 0.71, "learning_rate": 4.133832927860356e-06, "loss": 0.4507, "step": 6200 }, { "epoch": 0.71, "learning_rate": 4.130835491951699e-06, "loss": 0.4712, "step": 6201 }, { "epoch": 0.71, "learning_rate": 4.127838860249617e-06, "loss": 0.4428, "step": 6202 }, { "epoch": 0.71, "learning_rate": 4.124843033164716e-06, "loss": 0.4576, "step": 6203 }, { "epoch": 0.71, "learning_rate": 4.12184801110749e-06, "loss": 0.4357, "step": 6204 }, { "epoch": 0.71, "learning_rate": 4.11885379448832e-06, "loss": 0.4641, "step": 6205 }, { "epoch": 0.71, "learning_rate": 4.115860383717486e-06, "loss": 0.4702, "step": 6206 }, { "epoch": 0.71, "learning_rate": 4.1128677792051465e-06, "loss": 0.4636, "step": 6207 }, { "epoch": 0.71, "learning_rate": 4.109875981361363e-06, "loss": 0.4425, "step": 6208 }, { "epoch": 0.71, "learning_rate": 4.106884990596073e-06, "loss": 0.4679, "step": 6209 }, { "epoch": 0.71, "learning_rate": 4.103894807319106e-06, "loss": 0.4445, "step": 6210 }, { "epoch": 0.71, "learning_rate": 4.100905431940189e-06, "loss": 0.4616, "step": 6211 }, { "epoch": 0.71, "learning_rate": 4.097916864868932e-06, "loss": 0.4389, "step": 6212 }, { "epoch": 0.71, "learning_rate": 4.0949291065148375e-06, "loss": 0.4391, "step": 6213 }, { "epoch": 0.71, "learning_rate": 4.091942157287294e-06, "loss": 0.4661, "step": 6214 }, { "epoch": 0.71, "learning_rate": 4.088956017595575e-06, "loss": 0.453, "step": 6215 }, { "epoch": 0.71, "learning_rate": 4.085970687848857e-06, "loss": 0.4618, "step": 6216 }, { "epoch": 0.71, "learning_rate": 4.082986168456192e-06, "loss": 0.4677, "step": 6217 }, { "epoch": 0.71, "learning_rate": 4.080002459826523e-06, "loss": 0.439, "step": 6218 }, { "epoch": 0.71, "learning_rate": 4.077019562368691e-06, "loss": 0.4778, "step": 6219 }, { "epoch": 0.71, "learning_rate": 4.074037476491414e-06, "loss": 0.4595, "step": 6220 }, { "epoch": 0.71, "learning_rate": 4.071056202603305e-06, "loss": 0.446, "step": 6221 }, { "epoch": 0.71, "learning_rate": 4.0680757411128714e-06, "loss": 0.4495, "step": 6222 }, { "epoch": 0.71, "learning_rate": 4.0650960924284945e-06, "loss": 0.4578, "step": 6223 }, { "epoch": 0.71, "learning_rate": 4.06211725695846e-06, "loss": 0.4525, "step": 6224 }, { "epoch": 0.71, "learning_rate": 4.059139235110928e-06, "loss": 0.4576, "step": 6225 }, { "epoch": 0.71, "learning_rate": 4.056162027293962e-06, "loss": 0.4491, "step": 6226 }, { "epoch": 0.71, "learning_rate": 4.053185633915501e-06, "loss": 0.4703, "step": 6227 }, { "epoch": 0.71, "learning_rate": 4.050210055383373e-06, "loss": 0.447, "step": 6228 }, { "epoch": 0.71, "learning_rate": 4.047235292105308e-06, "loss": 0.4667, "step": 6229 }, { "epoch": 0.71, "learning_rate": 4.0442613444889065e-06, "loss": 0.4357, "step": 6230 }, { "epoch": 0.71, "learning_rate": 4.04128821294167e-06, "loss": 0.455, "step": 6231 }, { "epoch": 0.71, "learning_rate": 4.0383158978709865e-06, "loss": 0.4835, "step": 6232 }, { "epoch": 0.71, "learning_rate": 4.035344399684124e-06, "loss": 0.4562, "step": 6233 }, { "epoch": 0.71, "learning_rate": 4.032373718788248e-06, "loss": 0.4429, "step": 6234 }, { "epoch": 0.71, "learning_rate": 4.029403855590409e-06, "loss": 0.4534, "step": 6235 }, { "epoch": 0.71, "learning_rate": 4.026434810497538e-06, "loss": 0.4701, "step": 6236 }, { "epoch": 0.71, "learning_rate": 4.023466583916469e-06, "loss": 0.4494, "step": 6237 }, { "epoch": 0.71, "learning_rate": 4.020499176253907e-06, "loss": 0.4445, "step": 6238 }, { "epoch": 0.71, "learning_rate": 4.017532587916461e-06, "loss": 0.4381, "step": 6239 }, { "epoch": 0.71, "learning_rate": 4.014566819310612e-06, "loss": 0.4701, "step": 6240 }, { "epoch": 0.71, "learning_rate": 4.011601870842739e-06, "loss": 0.4726, "step": 6241 }, { "epoch": 0.71, "learning_rate": 4.008637742919114e-06, "loss": 0.4449, "step": 6242 }, { "epoch": 0.71, "learning_rate": 4.005674435945881e-06, "loss": 0.461, "step": 6243 }, { "epoch": 0.71, "learning_rate": 4.0027119503290776e-06, "loss": 0.4431, "step": 6244 }, { "epoch": 0.71, "learning_rate": 3.999750286474637e-06, "loss": 0.4566, "step": 6245 }, { "epoch": 0.71, "learning_rate": 3.996789444788366e-06, "loss": 0.4659, "step": 6246 }, { "epoch": 0.71, "learning_rate": 3.993829425675974e-06, "loss": 0.4216, "step": 6247 }, { "epoch": 0.71, "learning_rate": 3.99087022954304e-06, "loss": 0.4622, "step": 6248 }, { "epoch": 0.71, "learning_rate": 3.987911856795047e-06, "loss": 0.4577, "step": 6249 }, { "epoch": 0.71, "learning_rate": 3.98495430783736e-06, "loss": 0.4687, "step": 6250 }, { "epoch": 0.71, "learning_rate": 3.981997583075222e-06, "loss": 0.4482, "step": 6251 }, { "epoch": 0.71, "learning_rate": 3.979041682913777e-06, "loss": 0.4611, "step": 6252 }, { "epoch": 0.71, "learning_rate": 3.976086607758047e-06, "loss": 0.4587, "step": 6253 }, { "epoch": 0.71, "learning_rate": 3.973132358012939e-06, "loss": 0.4507, "step": 6254 }, { "epoch": 0.71, "learning_rate": 3.970178934083259e-06, "loss": 0.4569, "step": 6255 }, { "epoch": 0.71, "learning_rate": 3.967226336373686e-06, "loss": 0.4404, "step": 6256 }, { "epoch": 0.72, "learning_rate": 3.964274565288792e-06, "loss": 0.4412, "step": 6257 }, { "epoch": 0.72, "learning_rate": 3.961323621233036e-06, "loss": 0.465, "step": 6258 }, { "epoch": 0.72, "learning_rate": 3.9583735046107655e-06, "loss": 0.4492, "step": 6259 }, { "epoch": 0.72, "learning_rate": 3.9554242158262134e-06, "loss": 0.4508, "step": 6260 }, { "epoch": 0.72, "learning_rate": 3.952475755283497e-06, "loss": 0.4388, "step": 6261 }, { "epoch": 0.72, "learning_rate": 3.949528123386617e-06, "loss": 0.4523, "step": 6262 }, { "epoch": 0.72, "learning_rate": 3.94658132053947e-06, "loss": 0.4702, "step": 6263 }, { "epoch": 0.72, "learning_rate": 3.943635347145829e-06, "loss": 0.4598, "step": 6264 }, { "epoch": 0.72, "learning_rate": 3.940690203609364e-06, "loss": 0.4392, "step": 6265 }, { "epoch": 0.72, "learning_rate": 3.937745890333623e-06, "loss": 0.4792, "step": 6266 }, { "epoch": 0.72, "learning_rate": 3.934802407722038e-06, "loss": 0.4307, "step": 6267 }, { "epoch": 0.72, "learning_rate": 3.931859756177936e-06, "loss": 0.4622, "step": 6268 }, { "epoch": 0.72, "learning_rate": 3.928917936104529e-06, "loss": 0.4523, "step": 6269 }, { "epoch": 0.72, "learning_rate": 3.925976947904906e-06, "loss": 0.4647, "step": 6270 }, { "epoch": 0.72, "learning_rate": 3.923036791982053e-06, "loss": 0.4302, "step": 6271 }, { "epoch": 0.72, "learning_rate": 3.920097468738833e-06, "loss": 0.4587, "step": 6272 }, { "epoch": 0.72, "learning_rate": 3.917158978578003e-06, "loss": 0.4541, "step": 6273 }, { "epoch": 0.72, "learning_rate": 3.914221321902199e-06, "loss": 0.4458, "step": 6274 }, { "epoch": 0.72, "learning_rate": 3.911284499113943e-06, "loss": 0.4601, "step": 6275 }, { "epoch": 0.72, "learning_rate": 3.908348510615653e-06, "loss": 0.4432, "step": 6276 }, { "epoch": 0.72, "learning_rate": 3.905413356809615e-06, "loss": 0.4498, "step": 6277 }, { "epoch": 0.72, "learning_rate": 3.902479038098017e-06, "loss": 0.4558, "step": 6278 }, { "epoch": 0.72, "learning_rate": 3.899545554882927e-06, "loss": 0.4669, "step": 6279 }, { "epoch": 0.72, "learning_rate": 3.896612907566294e-06, "loss": 0.4479, "step": 6280 }, { "epoch": 0.72, "learning_rate": 3.893681096549961e-06, "loss": 0.4509, "step": 6281 }, { "epoch": 0.72, "learning_rate": 3.890750122235645e-06, "loss": 0.4552, "step": 6282 }, { "epoch": 0.72, "learning_rate": 3.887819985024962e-06, "loss": 0.4569, "step": 6283 }, { "epoch": 0.72, "learning_rate": 3.884890685319402e-06, "loss": 0.4695, "step": 6284 }, { "epoch": 0.72, "learning_rate": 3.881962223520343e-06, "loss": 0.4291, "step": 6285 }, { "epoch": 0.72, "learning_rate": 3.879034600029054e-06, "loss": 0.4662, "step": 6286 }, { "epoch": 0.72, "learning_rate": 3.876107815246678e-06, "loss": 0.4642, "step": 6287 }, { "epoch": 0.72, "learning_rate": 3.873181869574256e-06, "loss": 0.4396, "step": 6288 }, { "epoch": 0.72, "learning_rate": 3.87025676341271e-06, "loss": 0.4598, "step": 6289 }, { "epoch": 0.72, "learning_rate": 3.867332497162836e-06, "loss": 0.4541, "step": 6290 }, { "epoch": 0.72, "learning_rate": 3.864409071225334e-06, "loss": 0.4548, "step": 6291 }, { "epoch": 0.72, "learning_rate": 3.861486486000771e-06, "loss": 0.4845, "step": 6292 }, { "epoch": 0.72, "learning_rate": 3.858564741889608e-06, "loss": 0.451, "step": 6293 }, { "epoch": 0.72, "learning_rate": 3.855643839292193e-06, "loss": 0.4693, "step": 6294 }, { "epoch": 0.72, "learning_rate": 3.852723778608748e-06, "loss": 0.4537, "step": 6295 }, { "epoch": 0.72, "learning_rate": 3.849804560239394e-06, "loss": 0.4532, "step": 6296 }, { "epoch": 0.72, "learning_rate": 3.846886184584122e-06, "loss": 0.4356, "step": 6297 }, { "epoch": 0.72, "learning_rate": 3.8439686520428185e-06, "loss": 0.4561, "step": 6298 }, { "epoch": 0.72, "learning_rate": 3.841051963015254e-06, "loss": 0.4448, "step": 6299 }, { "epoch": 0.72, "learning_rate": 3.8381361179010755e-06, "loss": 0.4528, "step": 6300 }, { "epoch": 0.72, "learning_rate": 3.8352211170998165e-06, "loss": 0.4597, "step": 6301 }, { "epoch": 0.72, "learning_rate": 3.8323069610109046e-06, "loss": 0.4527, "step": 6302 }, { "epoch": 0.72, "learning_rate": 3.829393650033635e-06, "loss": 0.4397, "step": 6303 }, { "epoch": 0.72, "learning_rate": 3.8264811845672055e-06, "loss": 0.4605, "step": 6304 }, { "epoch": 0.72, "learning_rate": 3.823569565010682e-06, "loss": 0.4474, "step": 6305 }, { "epoch": 0.72, "learning_rate": 3.820658791763023e-06, "loss": 0.4566, "step": 6306 }, { "epoch": 0.72, "learning_rate": 3.817748865223075e-06, "loss": 0.4645, "step": 6307 }, { "epoch": 0.72, "learning_rate": 3.814839785789555e-06, "loss": 0.4646, "step": 6308 }, { "epoch": 0.72, "learning_rate": 3.811931553861078e-06, "loss": 0.4435, "step": 6309 }, { "epoch": 0.72, "learning_rate": 3.809024169836134e-06, "loss": 0.4757, "step": 6310 }, { "epoch": 0.72, "learning_rate": 3.8061176341130955e-06, "loss": 0.4353, "step": 6311 }, { "epoch": 0.72, "learning_rate": 3.803211947090232e-06, "loss": 0.4753, "step": 6312 }, { "epoch": 0.72, "learning_rate": 3.8003071091656806e-06, "loss": 0.4374, "step": 6313 }, { "epoch": 0.72, "learning_rate": 3.7974031207374685e-06, "loss": 0.4449, "step": 6314 }, { "epoch": 0.72, "learning_rate": 3.7944999822035077e-06, "loss": 0.4608, "step": 6315 }, { "epoch": 0.72, "learning_rate": 3.791597693961596e-06, "loss": 0.4467, "step": 6316 }, { "epoch": 0.72, "learning_rate": 3.788696256409412e-06, "loss": 0.4641, "step": 6317 }, { "epoch": 0.72, "learning_rate": 3.7857956699445164e-06, "loss": 0.467, "step": 6318 }, { "epoch": 0.72, "learning_rate": 3.78289593496435e-06, "loss": 0.448, "step": 6319 }, { "epoch": 0.72, "learning_rate": 3.7799970518662477e-06, "loss": 0.4555, "step": 6320 }, { "epoch": 0.72, "learning_rate": 3.7770990210474147e-06, "loss": 0.4534, "step": 6321 }, { "epoch": 0.72, "learning_rate": 3.774201842904953e-06, "loss": 0.4596, "step": 6322 }, { "epoch": 0.72, "learning_rate": 3.771305517835837e-06, "loss": 0.4588, "step": 6323 }, { "epoch": 0.72, "learning_rate": 3.7684100462369244e-06, "loss": 0.466, "step": 6324 }, { "epoch": 0.72, "learning_rate": 3.765515428504963e-06, "loss": 0.4445, "step": 6325 }, { "epoch": 0.72, "learning_rate": 3.7626216650365833e-06, "loss": 0.4649, "step": 6326 }, { "epoch": 0.72, "learning_rate": 3.7597287562282892e-06, "loss": 0.4526, "step": 6327 }, { "epoch": 0.72, "learning_rate": 3.7568367024764794e-06, "loss": 0.4537, "step": 6328 }, { "epoch": 0.72, "learning_rate": 3.7539455041774255e-06, "loss": 0.4432, "step": 6329 }, { "epoch": 0.72, "learning_rate": 3.7510551617272907e-06, "loss": 0.4636, "step": 6330 }, { "epoch": 0.72, "learning_rate": 3.748165675522113e-06, "loss": 0.4407, "step": 6331 }, { "epoch": 0.72, "learning_rate": 3.7452770459578134e-06, "loss": 0.4403, "step": 6332 }, { "epoch": 0.72, "learning_rate": 3.742389273430208e-06, "loss": 0.4471, "step": 6333 }, { "epoch": 0.72, "learning_rate": 3.7395023583349755e-06, "loss": 0.4537, "step": 6334 }, { "epoch": 0.72, "learning_rate": 3.7366163010676937e-06, "loss": 0.4709, "step": 6335 }, { "epoch": 0.72, "learning_rate": 3.733731102023819e-06, "loss": 0.4529, "step": 6336 }, { "epoch": 0.72, "learning_rate": 3.730846761598682e-06, "loss": 0.4427, "step": 6337 }, { "epoch": 0.72, "learning_rate": 3.7279632801875076e-06, "loss": 0.4683, "step": 6338 }, { "epoch": 0.72, "learning_rate": 3.725080658185395e-06, "loss": 0.4596, "step": 6339 }, { "epoch": 0.72, "learning_rate": 3.7221988959873232e-06, "loss": 0.4385, "step": 6340 }, { "epoch": 0.72, "learning_rate": 3.7193179939881665e-06, "loss": 0.4397, "step": 6341 }, { "epoch": 0.72, "learning_rate": 3.716437952582663e-06, "loss": 0.4779, "step": 6342 }, { "epoch": 0.72, "learning_rate": 3.7135587721654533e-06, "loss": 0.4569, "step": 6343 }, { "epoch": 0.73, "learning_rate": 3.710680453131039e-06, "loss": 0.4611, "step": 6344 }, { "epoch": 0.73, "learning_rate": 3.7078029958738194e-06, "loss": 0.4375, "step": 6345 }, { "epoch": 0.73, "learning_rate": 3.7049264007880735e-06, "loss": 0.4601, "step": 6346 }, { "epoch": 0.73, "learning_rate": 3.7020506682679524e-06, "loss": 0.4459, "step": 6347 }, { "epoch": 0.73, "learning_rate": 3.699175798707502e-06, "loss": 0.4453, "step": 6348 }, { "epoch": 0.73, "learning_rate": 3.6963017925006407e-06, "loss": 0.4557, "step": 6349 }, { "epoch": 0.73, "learning_rate": 3.6934286500411675e-06, "loss": 0.4617, "step": 6350 }, { "epoch": 0.73, "learning_rate": 3.690556371722774e-06, "loss": 0.46, "step": 6351 }, { "epoch": 0.73, "learning_rate": 3.6876849579390205e-06, "loss": 0.4603, "step": 6352 }, { "epoch": 0.73, "learning_rate": 3.6848144090833602e-06, "loss": 0.4403, "step": 6353 }, { "epoch": 0.73, "learning_rate": 3.681944725549117e-06, "loss": 0.4655, "step": 6354 }, { "epoch": 0.73, "learning_rate": 3.6790759077295046e-06, "loss": 0.4291, "step": 6355 }, { "epoch": 0.73, "learning_rate": 3.676207956017618e-06, "loss": 0.4618, "step": 6356 }, { "epoch": 0.73, "learning_rate": 3.6733408708064265e-06, "loss": 0.4499, "step": 6357 }, { "epoch": 0.73, "learning_rate": 3.6704746524887835e-06, "loss": 0.5017, "step": 6358 }, { "epoch": 0.73, "learning_rate": 3.667609301457431e-06, "loss": 0.4465, "step": 6359 }, { "epoch": 0.73, "learning_rate": 3.664744818104977e-06, "loss": 0.4627, "step": 6360 }, { "epoch": 0.73, "learning_rate": 3.6618812028239304e-06, "loss": 0.4456, "step": 6361 }, { "epoch": 0.73, "learning_rate": 3.65901845600666e-06, "loss": 0.465, "step": 6362 }, { "epoch": 0.73, "learning_rate": 3.656156578045431e-06, "loss": 0.4447, "step": 6363 }, { "epoch": 0.73, "learning_rate": 3.653295569332389e-06, "loss": 0.4692, "step": 6364 }, { "epoch": 0.73, "learning_rate": 3.650435430259548e-06, "loss": 0.4425, "step": 6365 }, { "epoch": 0.73, "learning_rate": 3.6475761612188177e-06, "loss": 0.4569, "step": 6366 }, { "epoch": 0.73, "learning_rate": 3.644717762601978e-06, "loss": 0.4629, "step": 6367 }, { "epoch": 0.73, "learning_rate": 3.6418602348006903e-06, "loss": 0.4604, "step": 6368 }, { "epoch": 0.73, "learning_rate": 3.639003578206508e-06, "loss": 0.4635, "step": 6369 }, { "epoch": 0.73, "learning_rate": 3.6361477932108513e-06, "loss": 0.4692, "step": 6370 }, { "epoch": 0.73, "learning_rate": 3.633292880205024e-06, "loss": 0.4452, "step": 6371 }, { "epoch": 0.73, "learning_rate": 3.630438839580217e-06, "loss": 0.4524, "step": 6372 }, { "epoch": 0.73, "learning_rate": 3.627585671727496e-06, "loss": 0.4447, "step": 6373 }, { "epoch": 0.73, "learning_rate": 3.6247333770378133e-06, "loss": 0.4762, "step": 6374 }, { "epoch": 0.73, "learning_rate": 3.6218819559019934e-06, "loss": 0.4542, "step": 6375 }, { "epoch": 0.73, "learning_rate": 3.6190314087107415e-06, "loss": 0.4638, "step": 6376 }, { "epoch": 0.73, "learning_rate": 3.6161817358546513e-06, "loss": 0.4357, "step": 6377 }, { "epoch": 0.73, "learning_rate": 3.6133329377241866e-06, "loss": 0.4745, "step": 6378 }, { "epoch": 0.73, "learning_rate": 3.6104850147097035e-06, "loss": 0.4524, "step": 6379 }, { "epoch": 0.73, "learning_rate": 3.6076379672014263e-06, "loss": 0.4682, "step": 6380 }, { "epoch": 0.73, "learning_rate": 3.6047917955894606e-06, "loss": 0.4454, "step": 6381 }, { "epoch": 0.73, "learning_rate": 3.6019465002638e-06, "loss": 0.4475, "step": 6382 }, { "epoch": 0.73, "learning_rate": 3.5991020816143164e-06, "loss": 0.452, "step": 6383 }, { "epoch": 0.73, "learning_rate": 3.5962585400307504e-06, "loss": 0.4758, "step": 6384 }, { "epoch": 0.73, "learning_rate": 3.5934158759027405e-06, "loss": 0.4591, "step": 6385 }, { "epoch": 0.73, "learning_rate": 3.590574089619786e-06, "loss": 0.4632, "step": 6386 }, { "epoch": 0.73, "learning_rate": 3.587733181571282e-06, "loss": 0.4452, "step": 6387 }, { "epoch": 0.73, "learning_rate": 3.5848931521464947e-06, "loss": 0.4504, "step": 6388 }, { "epoch": 0.73, "learning_rate": 3.5820540017345663e-06, "loss": 0.4659, "step": 6389 }, { "epoch": 0.73, "learning_rate": 3.5792157307245313e-06, "loss": 0.4513, "step": 6390 }, { "epoch": 0.73, "learning_rate": 3.5763783395052887e-06, "loss": 0.4511, "step": 6391 }, { "epoch": 0.73, "learning_rate": 3.5735418284656287e-06, "loss": 0.4506, "step": 6392 }, { "epoch": 0.73, "learning_rate": 3.5707061979942205e-06, "loss": 0.4609, "step": 6393 }, { "epoch": 0.73, "learning_rate": 3.5678714484796006e-06, "loss": 0.4443, "step": 6394 }, { "epoch": 0.73, "learning_rate": 3.565037580310201e-06, "loss": 0.4451, "step": 6395 }, { "epoch": 0.73, "learning_rate": 3.56220459387432e-06, "loss": 0.4531, "step": 6396 }, { "epoch": 0.73, "learning_rate": 3.559372489560139e-06, "loss": 0.4487, "step": 6397 }, { "epoch": 0.73, "learning_rate": 3.5565412677557233e-06, "loss": 0.4554, "step": 6398 }, { "epoch": 0.73, "learning_rate": 3.553710928849009e-06, "loss": 0.4365, "step": 6399 }, { "epoch": 0.73, "learning_rate": 3.550881473227822e-06, "loss": 0.4724, "step": 6400 }, { "epoch": 0.73, "learning_rate": 3.548052901279854e-06, "loss": 0.4517, "step": 6401 }, { "epoch": 0.73, "learning_rate": 3.5452252133926856e-06, "loss": 0.4618, "step": 6402 }, { "epoch": 0.73, "learning_rate": 3.5423984099537754e-06, "loss": 0.4458, "step": 6403 }, { "epoch": 0.73, "learning_rate": 3.5395724913504546e-06, "loss": 0.4444, "step": 6404 }, { "epoch": 0.73, "learning_rate": 3.536747457969942e-06, "loss": 0.4485, "step": 6405 }, { "epoch": 0.73, "learning_rate": 3.5339233101993287e-06, "loss": 0.4616, "step": 6406 }, { "epoch": 0.73, "learning_rate": 3.5311000484255796e-06, "loss": 0.4301, "step": 6407 }, { "epoch": 0.73, "learning_rate": 3.5282776730355537e-06, "loss": 0.4606, "step": 6408 }, { "epoch": 0.73, "learning_rate": 3.5254561844159718e-06, "loss": 0.4518, "step": 6409 }, { "epoch": 0.73, "learning_rate": 3.5226355829534475e-06, "loss": 0.4358, "step": 6410 }, { "epoch": 0.73, "learning_rate": 3.51981586903446e-06, "loss": 0.4838, "step": 6411 }, { "epoch": 0.73, "learning_rate": 3.516997043045376e-06, "loss": 0.4628, "step": 6412 }, { "epoch": 0.73, "learning_rate": 3.5141791053724405e-06, "loss": 0.4449, "step": 6413 }, { "epoch": 0.73, "learning_rate": 3.5113620564017727e-06, "loss": 0.4448, "step": 6414 }, { "epoch": 0.73, "learning_rate": 3.5085458965193654e-06, "loss": 0.4661, "step": 6415 }, { "epoch": 0.73, "learning_rate": 3.5057306261111024e-06, "loss": 0.4502, "step": 6416 }, { "epoch": 0.73, "learning_rate": 3.502916245562733e-06, "loss": 0.4547, "step": 6417 }, { "epoch": 0.73, "learning_rate": 3.5001027552598952e-06, "loss": 0.4459, "step": 6418 }, { "epoch": 0.73, "learning_rate": 3.4972901555880957e-06, "loss": 0.4551, "step": 6419 }, { "epoch": 0.73, "learning_rate": 3.4944784469327253e-06, "loss": 0.4592, "step": 6420 }, { "epoch": 0.73, "learning_rate": 3.491667629679054e-06, "loss": 0.4369, "step": 6421 }, { "epoch": 0.73, "learning_rate": 3.488857704212224e-06, "loss": 0.4437, "step": 6422 }, { "epoch": 0.73, "learning_rate": 3.4860486709172536e-06, "loss": 0.4401, "step": 6423 }, { "epoch": 0.73, "learning_rate": 3.4832405301790507e-06, "loss": 0.4533, "step": 6424 }, { "epoch": 0.73, "learning_rate": 3.4804332823823862e-06, "loss": 0.4487, "step": 6425 }, { "epoch": 0.73, "learning_rate": 3.477626927911921e-06, "loss": 0.4677, "step": 6426 }, { "epoch": 0.73, "learning_rate": 3.4748214671521875e-06, "loss": 0.4409, "step": 6427 }, { "epoch": 0.73, "learning_rate": 3.4720169004875914e-06, "loss": 0.4481, "step": 6428 }, { "epoch": 0.73, "learning_rate": 3.469213228302425e-06, "loss": 0.4797, "step": 6429 }, { "epoch": 0.73, "learning_rate": 3.466410450980854e-06, "loss": 0.4376, "step": 6430 }, { "epoch": 0.73, "learning_rate": 3.4636085689069244e-06, "loss": 0.4519, "step": 6431 }, { "epoch": 0.74, "learning_rate": 3.4608075824645524e-06, "loss": 0.4359, "step": 6432 }, { "epoch": 0.74, "learning_rate": 3.4580074920375352e-06, "loss": 0.4585, "step": 6433 }, { "epoch": 0.74, "learning_rate": 3.4552082980095514e-06, "loss": 0.4479, "step": 6434 }, { "epoch": 0.74, "learning_rate": 3.4524100007641517e-06, "loss": 0.4467, "step": 6435 }, { "epoch": 0.74, "learning_rate": 3.4496126006847596e-06, "loss": 0.4351, "step": 6436 }, { "epoch": 0.74, "learning_rate": 3.446816098154692e-06, "loss": 0.4652, "step": 6437 }, { "epoch": 0.74, "learning_rate": 3.4440204935571208e-06, "loss": 0.443, "step": 6438 }, { "epoch": 0.74, "learning_rate": 3.441225787275113e-06, "loss": 0.4518, "step": 6439 }, { "epoch": 0.74, "learning_rate": 3.4384319796916075e-06, "loss": 0.4392, "step": 6440 }, { "epoch": 0.74, "learning_rate": 3.435639071189413e-06, "loss": 0.4458, "step": 6441 }, { "epoch": 0.74, "learning_rate": 3.4328470621512257e-06, "loss": 0.462, "step": 6442 }, { "epoch": 0.74, "learning_rate": 3.430055952959607e-06, "loss": 0.4441, "step": 6443 }, { "epoch": 0.74, "learning_rate": 3.427265743997007e-06, "loss": 0.4649, "step": 6444 }, { "epoch": 0.74, "learning_rate": 3.4244764356457438e-06, "loss": 0.4703, "step": 6445 }, { "epoch": 0.74, "learning_rate": 3.4216880282880128e-06, "loss": 0.4514, "step": 6446 }, { "epoch": 0.74, "learning_rate": 3.4189005223058937e-06, "loss": 0.4628, "step": 6447 }, { "epoch": 0.74, "learning_rate": 3.416113918081331e-06, "loss": 0.4485, "step": 6448 }, { "epoch": 0.74, "learning_rate": 3.4133282159961535e-06, "loss": 0.4489, "step": 6449 }, { "epoch": 0.74, "learning_rate": 3.4105434164320695e-06, "loss": 0.4353, "step": 6450 }, { "epoch": 0.74, "learning_rate": 3.4077595197706505e-06, "loss": 0.4739, "step": 6451 }, { "epoch": 0.74, "learning_rate": 3.404976526393361e-06, "loss": 0.4615, "step": 6452 }, { "epoch": 0.74, "learning_rate": 3.4021944366815286e-06, "loss": 0.4412, "step": 6453 }, { "epoch": 0.74, "learning_rate": 3.399413251016359e-06, "loss": 0.4565, "step": 6454 }, { "epoch": 0.74, "learning_rate": 3.3966329697789424e-06, "loss": 0.4467, "step": 6455 }, { "epoch": 0.74, "learning_rate": 3.393853593350235e-06, "loss": 0.4398, "step": 6456 }, { "epoch": 0.74, "learning_rate": 3.391075122111077e-06, "loss": 0.4441, "step": 6457 }, { "epoch": 0.74, "learning_rate": 3.3882975564421773e-06, "loss": 0.4504, "step": 6458 }, { "epoch": 0.74, "learning_rate": 3.3855208967241247e-06, "loss": 0.46, "step": 6459 }, { "epoch": 0.74, "learning_rate": 3.3827451433373904e-06, "loss": 0.4562, "step": 6460 }, { "epoch": 0.74, "learning_rate": 3.379970296662305e-06, "loss": 0.468, "step": 6461 }, { "epoch": 0.74, "learning_rate": 3.3771963570790924e-06, "loss": 0.4444, "step": 6462 }, { "epoch": 0.74, "learning_rate": 3.3744233249678403e-06, "loss": 0.4594, "step": 6463 }, { "epoch": 0.74, "learning_rate": 3.3716512007085133e-06, "loss": 0.4506, "step": 6464 }, { "epoch": 0.74, "learning_rate": 3.368879984680962e-06, "loss": 0.4545, "step": 6465 }, { "epoch": 0.74, "learning_rate": 3.366109677264895e-06, "loss": 0.4571, "step": 6466 }, { "epoch": 0.74, "learning_rate": 3.363340278839916e-06, "loss": 0.4337, "step": 6467 }, { "epoch": 0.74, "learning_rate": 3.3605717897854872e-06, "loss": 0.4496, "step": 6468 }, { "epoch": 0.74, "learning_rate": 3.357804210480955e-06, "loss": 0.4677, "step": 6469 }, { "epoch": 0.74, "learning_rate": 3.355037541305545e-06, "loss": 0.441, "step": 6470 }, { "epoch": 0.74, "learning_rate": 3.3522717826383477e-06, "loss": 0.4474, "step": 6471 }, { "epoch": 0.74, "learning_rate": 3.349506934858331e-06, "loss": 0.4609, "step": 6472 }, { "epoch": 0.74, "learning_rate": 3.3467429983443477e-06, "loss": 0.4565, "step": 6473 }, { "epoch": 0.74, "learning_rate": 3.3439799734751132e-06, "loss": 0.4461, "step": 6474 }, { "epoch": 0.74, "learning_rate": 3.3412178606292276e-06, "loss": 0.465, "step": 6475 }, { "epoch": 0.74, "learning_rate": 3.3384566601851574e-06, "loss": 0.4509, "step": 6476 }, { "epoch": 0.74, "learning_rate": 3.3356963725212523e-06, "loss": 0.4677, "step": 6477 }, { "epoch": 0.74, "learning_rate": 3.3329369980157345e-06, "loss": 0.4562, "step": 6478 }, { "epoch": 0.74, "learning_rate": 3.330178537046699e-06, "loss": 0.4441, "step": 6479 }, { "epoch": 0.74, "learning_rate": 3.327420989992112e-06, "loss": 0.4541, "step": 6480 }, { "epoch": 0.74, "learning_rate": 3.3246643572298253e-06, "loss": 0.466, "step": 6481 }, { "epoch": 0.74, "learning_rate": 3.321908639137553e-06, "loss": 0.4409, "step": 6482 }, { "epoch": 0.74, "learning_rate": 3.3191538360928977e-06, "loss": 0.447, "step": 6483 }, { "epoch": 0.74, "learning_rate": 3.3163999484733232e-06, "loss": 0.4702, "step": 6484 }, { "epoch": 0.74, "learning_rate": 3.313646976656172e-06, "loss": 0.4823, "step": 6485 }, { "epoch": 0.74, "learning_rate": 3.3108949210186657e-06, "loss": 0.4589, "step": 6486 }, { "epoch": 0.74, "learning_rate": 3.308143781937898e-06, "loss": 0.46, "step": 6487 }, { "epoch": 0.74, "learning_rate": 3.305393559790838e-06, "loss": 0.4426, "step": 6488 }, { "epoch": 0.74, "learning_rate": 3.302644254954326e-06, "loss": 0.4549, "step": 6489 }, { "epoch": 0.74, "learning_rate": 3.299895867805074e-06, "loss": 0.4496, "step": 6490 }, { "epoch": 0.74, "learning_rate": 3.2971483987196783e-06, "loss": 0.4512, "step": 6491 }, { "epoch": 0.74, "learning_rate": 3.294401848074602e-06, "loss": 0.4596, "step": 6492 }, { "epoch": 0.74, "learning_rate": 3.2916562162461784e-06, "loss": 0.4452, "step": 6493 }, { "epoch": 0.74, "learning_rate": 3.288911503610629e-06, "loss": 0.4427, "step": 6494 }, { "epoch": 0.74, "learning_rate": 3.2861677105440335e-06, "loss": 0.4639, "step": 6495 }, { "epoch": 0.74, "learning_rate": 3.2834248374223556e-06, "loss": 0.4535, "step": 6496 }, { "epoch": 0.74, "learning_rate": 3.2806828846214324e-06, "loss": 0.4548, "step": 6497 }, { "epoch": 0.74, "learning_rate": 3.277941852516968e-06, "loss": 0.4639, "step": 6498 }, { "epoch": 0.74, "learning_rate": 3.2752017414845514e-06, "loss": 0.4343, "step": 6499 }, { "epoch": 0.74, "learning_rate": 3.2724625518996322e-06, "loss": 0.449, "step": 6500 }, { "epoch": 0.74, "learning_rate": 3.2697242841375452e-06, "loss": 0.4611, "step": 6501 }, { "epoch": 0.74, "learning_rate": 3.2669869385734943e-06, "loss": 0.4584, "step": 6502 }, { "epoch": 0.74, "learning_rate": 3.264250515582551e-06, "loss": 0.4496, "step": 6503 }, { "epoch": 0.74, "learning_rate": 3.2615150155396747e-06, "loss": 0.4493, "step": 6504 }, { "epoch": 0.74, "learning_rate": 3.258780438819681e-06, "loss": 0.4551, "step": 6505 }, { "epoch": 0.74, "learning_rate": 3.2560467857972744e-06, "loss": 0.4449, "step": 6506 }, { "epoch": 0.74, "learning_rate": 3.2533140568470266e-06, "loss": 0.4602, "step": 6507 }, { "epoch": 0.74, "learning_rate": 3.2505822523433785e-06, "loss": 0.4392, "step": 6508 }, { "epoch": 0.74, "learning_rate": 3.247851372660653e-06, "loss": 0.4686, "step": 6509 }, { "epoch": 0.74, "learning_rate": 3.2451214181730396e-06, "loss": 0.4433, "step": 6510 }, { "epoch": 0.74, "learning_rate": 3.2423923892545994e-06, "loss": 0.461, "step": 6511 }, { "epoch": 0.74, "learning_rate": 3.239664286279276e-06, "loss": 0.4404, "step": 6512 }, { "epoch": 0.74, "learning_rate": 3.2369371096208744e-06, "loss": 0.4545, "step": 6513 }, { "epoch": 0.74, "learning_rate": 3.2342108596530865e-06, "loss": 0.44, "step": 6514 }, { "epoch": 0.74, "learning_rate": 3.23148553674946e-06, "loss": 0.4454, "step": 6515 }, { "epoch": 0.74, "learning_rate": 3.2287611412834306e-06, "loss": 0.4478, "step": 6516 }, { "epoch": 0.74, "learning_rate": 3.226037673628305e-06, "loss": 0.4523, "step": 6517 }, { "epoch": 0.74, "learning_rate": 3.223315134157253e-06, "loss": 0.4633, "step": 6518 }, { "epoch": 0.75, "learning_rate": 3.220593523243324e-06, "loss": 0.4656, "step": 6519 }, { "epoch": 0.75, "learning_rate": 3.2178728412594417e-06, "loss": 0.4449, "step": 6520 }, { "epoch": 0.75, "learning_rate": 3.2151530885783967e-06, "loss": 0.4725, "step": 6521 }, { "epoch": 0.75, "learning_rate": 3.212434265572861e-06, "loss": 0.4602, "step": 6522 }, { "epoch": 0.75, "learning_rate": 3.209716372615369e-06, "loss": 0.4637, "step": 6523 }, { "epoch": 0.75, "learning_rate": 3.2069994100783376e-06, "loss": 0.4622, "step": 6524 }, { "epoch": 0.75, "learning_rate": 3.2042833783340453e-06, "loss": 0.4492, "step": 6525 }, { "epoch": 0.75, "learning_rate": 3.201568277754652e-06, "loss": 0.4493, "step": 6526 }, { "epoch": 0.75, "learning_rate": 3.1988541087121916e-06, "loss": 0.4665, "step": 6527 }, { "epoch": 0.75, "learning_rate": 3.1961408715785615e-06, "loss": 0.435, "step": 6528 }, { "epoch": 0.75, "learning_rate": 3.193428566725534e-06, "loss": 0.4442, "step": 6529 }, { "epoch": 0.75, "learning_rate": 3.1907171945247595e-06, "loss": 0.4554, "step": 6530 }, { "epoch": 0.75, "learning_rate": 3.1880067553477513e-06, "loss": 0.4353, "step": 6531 }, { "epoch": 0.75, "learning_rate": 3.1852972495659064e-06, "loss": 0.463, "step": 6532 }, { "epoch": 0.75, "learning_rate": 3.182588677550482e-06, "loss": 0.4648, "step": 6533 }, { "epoch": 0.75, "learning_rate": 3.179881039672619e-06, "loss": 0.4438, "step": 6534 }, { "epoch": 0.75, "learning_rate": 3.1771743363033156e-06, "loss": 0.4627, "step": 6535 }, { "epoch": 0.75, "learning_rate": 3.174468567813461e-06, "loss": 0.4732, "step": 6536 }, { "epoch": 0.75, "learning_rate": 3.171763734573796e-06, "loss": 0.434, "step": 6537 }, { "epoch": 0.75, "learning_rate": 3.169059836954952e-06, "loss": 0.4621, "step": 6538 }, { "epoch": 0.75, "learning_rate": 3.1663568753274153e-06, "loss": 0.4477, "step": 6539 }, { "epoch": 0.75, "learning_rate": 3.1636548500615583e-06, "loss": 0.4271, "step": 6540 }, { "epoch": 0.75, "learning_rate": 3.1609537615276174e-06, "loss": 0.4784, "step": 6541 }, { "epoch": 0.75, "learning_rate": 3.1582536100956973e-06, "loss": 0.4413, "step": 6542 }, { "epoch": 0.75, "learning_rate": 3.1555543961357824e-06, "loss": 0.4723, "step": 6543 }, { "epoch": 0.75, "learning_rate": 3.1528561200177254e-06, "loss": 0.4543, "step": 6544 }, { "epoch": 0.75, "learning_rate": 3.1501587821112532e-06, "loss": 0.4522, "step": 6545 }, { "epoch": 0.75, "learning_rate": 3.14746238278596e-06, "loss": 0.4649, "step": 6546 }, { "epoch": 0.75, "learning_rate": 3.1447669224113074e-06, "loss": 0.4431, "step": 6547 }, { "epoch": 0.75, "learning_rate": 3.1420724013566408e-06, "loss": 0.4451, "step": 6548 }, { "epoch": 0.75, "learning_rate": 3.1393788199911657e-06, "loss": 0.4428, "step": 6549 }, { "epoch": 0.75, "learning_rate": 3.136686178683961e-06, "loss": 0.468, "step": 6550 }, { "epoch": 0.75, "learning_rate": 3.1339944778039844e-06, "loss": 0.4625, "step": 6551 }, { "epoch": 0.75, "learning_rate": 3.131303717720053e-06, "loss": 0.4479, "step": 6552 }, { "epoch": 0.75, "learning_rate": 3.128613898800864e-06, "loss": 0.4522, "step": 6553 }, { "epoch": 0.75, "learning_rate": 3.125925021414985e-06, "loss": 0.4741, "step": 6554 }, { "epoch": 0.75, "learning_rate": 3.123237085930847e-06, "loss": 0.4563, "step": 6555 }, { "epoch": 0.75, "learning_rate": 3.1205500927167644e-06, "loss": 0.4503, "step": 6556 }, { "epoch": 0.75, "learning_rate": 3.1178640421409057e-06, "loss": 0.4515, "step": 6557 }, { "epoch": 0.75, "learning_rate": 3.11517893457133e-06, "loss": 0.4671, "step": 6558 }, { "epoch": 0.75, "learning_rate": 3.112494770375951e-06, "loss": 0.4659, "step": 6559 }, { "epoch": 0.75, "learning_rate": 3.1098115499225567e-06, "loss": 0.4397, "step": 6560 }, { "epoch": 0.75, "learning_rate": 3.107129273578815e-06, "loss": 0.4652, "step": 6561 }, { "epoch": 0.75, "learning_rate": 3.104447941712251e-06, "loss": 0.4627, "step": 6562 }, { "epoch": 0.75, "learning_rate": 3.1017675546902704e-06, "loss": 0.5041, "step": 6563 }, { "epoch": 0.75, "learning_rate": 3.0990881128801487e-06, "loss": 0.4534, "step": 6564 }, { "epoch": 0.75, "learning_rate": 3.096409616649023e-06, "loss": 0.4516, "step": 6565 }, { "epoch": 0.75, "learning_rate": 3.0937320663639148e-06, "loss": 0.4326, "step": 6566 }, { "epoch": 0.75, "learning_rate": 3.091055462391703e-06, "loss": 0.4685, "step": 6567 }, { "epoch": 0.75, "learning_rate": 3.088379805099141e-06, "loss": 0.4364, "step": 6568 }, { "epoch": 0.75, "learning_rate": 3.0857050948528576e-06, "loss": 0.4616, "step": 6569 }, { "epoch": 0.75, "learning_rate": 3.083031332019344e-06, "loss": 0.4496, "step": 6570 }, { "epoch": 0.75, "learning_rate": 3.0803585169649696e-06, "loss": 0.4441, "step": 6571 }, { "epoch": 0.75, "learning_rate": 3.0776866500559654e-06, "loss": 0.4711, "step": 6572 }, { "epoch": 0.75, "learning_rate": 3.0750157316584375e-06, "loss": 0.4634, "step": 6573 }, { "epoch": 0.75, "learning_rate": 3.0723457621383666e-06, "loss": 0.4329, "step": 6574 }, { "epoch": 0.75, "learning_rate": 3.0696767418615945e-06, "loss": 0.4494, "step": 6575 }, { "epoch": 0.75, "learning_rate": 3.067008671193833e-06, "loss": 0.4572, "step": 6576 }, { "epoch": 0.75, "learning_rate": 3.0643415505006733e-06, "loss": 0.4618, "step": 6577 }, { "epoch": 0.75, "learning_rate": 3.0616753801475653e-06, "loss": 0.4343, "step": 6578 }, { "epoch": 0.75, "learning_rate": 3.059010160499839e-06, "loss": 0.4473, "step": 6579 }, { "epoch": 0.75, "learning_rate": 3.056345891922684e-06, "loss": 0.4555, "step": 6580 }, { "epoch": 0.75, "learning_rate": 3.0536825747811695e-06, "loss": 0.4598, "step": 6581 }, { "epoch": 0.75, "learning_rate": 3.0510202094402242e-06, "loss": 0.4601, "step": 6582 }, { "epoch": 0.75, "learning_rate": 3.0483587962646545e-06, "loss": 0.4466, "step": 6583 }, { "epoch": 0.75, "learning_rate": 3.045698335619135e-06, "loss": 0.4614, "step": 6584 }, { "epoch": 0.75, "learning_rate": 3.0430388278682078e-06, "loss": 0.4739, "step": 6585 }, { "epoch": 0.75, "learning_rate": 3.04038027337628e-06, "loss": 0.4521, "step": 6586 }, { "epoch": 0.75, "learning_rate": 3.0377226725076394e-06, "loss": 0.4688, "step": 6587 }, { "epoch": 0.75, "learning_rate": 3.035066025626434e-06, "loss": 0.4473, "step": 6588 }, { "epoch": 0.75, "learning_rate": 3.0324103330966804e-06, "loss": 0.4427, "step": 6589 }, { "epoch": 0.75, "learning_rate": 3.02975559528227e-06, "loss": 0.4678, "step": 6590 }, { "epoch": 0.75, "learning_rate": 3.027101812546965e-06, "loss": 0.4627, "step": 6591 }, { "epoch": 0.75, "learning_rate": 3.024448985254387e-06, "loss": 0.4567, "step": 6592 }, { "epoch": 0.75, "learning_rate": 3.021797113768039e-06, "loss": 0.4516, "step": 6593 }, { "epoch": 0.75, "learning_rate": 3.0191461984512794e-06, "loss": 0.4481, "step": 6594 }, { "epoch": 0.75, "learning_rate": 3.016496239667349e-06, "loss": 0.4717, "step": 6595 }, { "epoch": 0.75, "learning_rate": 3.013847237779346e-06, "loss": 0.4614, "step": 6596 }, { "epoch": 0.75, "learning_rate": 3.0111991931502484e-06, "loss": 0.4335, "step": 6597 }, { "epoch": 0.75, "learning_rate": 3.0085521061428945e-06, "loss": 0.4489, "step": 6598 }, { "epoch": 0.75, "learning_rate": 3.005905977119992e-06, "loss": 0.4609, "step": 6599 }, { "epoch": 0.75, "learning_rate": 3.0032608064441206e-06, "loss": 0.4218, "step": 6600 }, { "epoch": 0.75, "learning_rate": 3.0006165944777333e-06, "loss": 0.4688, "step": 6601 }, { "epoch": 0.75, "learning_rate": 2.997973341583138e-06, "loss": 0.4433, "step": 6602 }, { "epoch": 0.75, "learning_rate": 2.9953310481225275e-06, "loss": 0.4752, "step": 6603 }, { "epoch": 0.75, "learning_rate": 2.992689714457947e-06, "loss": 0.4381, "step": 6604 }, { "epoch": 0.75, "learning_rate": 2.9900493409513256e-06, "loss": 0.459, "step": 6605 }, { "epoch": 0.75, "learning_rate": 2.9874099279644487e-06, "loss": 0.4376, "step": 6606 }, { "epoch": 0.76, "learning_rate": 2.984771475858973e-06, "loss": 0.4624, "step": 6607 }, { "epoch": 0.76, "learning_rate": 2.9821339849964324e-06, "loss": 0.4495, "step": 6608 }, { "epoch": 0.76, "learning_rate": 2.979497455738214e-06, "loss": 0.4727, "step": 6609 }, { "epoch": 0.76, "learning_rate": 2.976861888445586e-06, "loss": 0.4405, "step": 6610 }, { "epoch": 0.76, "learning_rate": 2.9742272834796813e-06, "loss": 0.4884, "step": 6611 }, { "epoch": 0.76, "learning_rate": 2.9715936412014945e-06, "loss": 0.4645, "step": 6612 }, { "epoch": 0.76, "learning_rate": 2.9689609619718996e-06, "loss": 0.4535, "step": 6613 }, { "epoch": 0.76, "learning_rate": 2.966329246151626e-06, "loss": 0.4459, "step": 6614 }, { "epoch": 0.76, "learning_rate": 2.9636984941012835e-06, "loss": 0.4543, "step": 6615 }, { "epoch": 0.76, "learning_rate": 2.9610687061813405e-06, "loss": 0.4395, "step": 6616 }, { "epoch": 0.76, "learning_rate": 2.9584398827521343e-06, "loss": 0.4394, "step": 6617 }, { "epoch": 0.76, "learning_rate": 2.9558120241738786e-06, "loss": 0.451, "step": 6618 }, { "epoch": 0.76, "learning_rate": 2.9531851308066426e-06, "loss": 0.468, "step": 6619 }, { "epoch": 0.76, "learning_rate": 2.950559203010371e-06, "loss": 0.4386, "step": 6620 }, { "epoch": 0.76, "learning_rate": 2.9479342411448797e-06, "loss": 0.4552, "step": 6621 }, { "epoch": 0.76, "learning_rate": 2.945310245569839e-06, "loss": 0.4542, "step": 6622 }, { "epoch": 0.76, "learning_rate": 2.942687216644803e-06, "loss": 0.4395, "step": 6623 }, { "epoch": 0.76, "learning_rate": 2.94006515472918e-06, "loss": 0.4551, "step": 6624 }, { "epoch": 0.76, "learning_rate": 2.9374440601822495e-06, "loss": 0.4472, "step": 6625 }, { "epoch": 0.76, "learning_rate": 2.9348239333631655e-06, "loss": 0.4362, "step": 6626 }, { "epoch": 0.76, "learning_rate": 2.9322047746309377e-06, "loss": 0.4542, "step": 6627 }, { "epoch": 0.76, "learning_rate": 2.929586584344456e-06, "loss": 0.4466, "step": 6628 }, { "epoch": 0.76, "learning_rate": 2.926969362862465e-06, "loss": 0.4727, "step": 6629 }, { "epoch": 0.76, "learning_rate": 2.924353110543584e-06, "loss": 0.4393, "step": 6630 }, { "epoch": 0.76, "learning_rate": 2.9217378277463025e-06, "loss": 0.4731, "step": 6631 }, { "epoch": 0.76, "learning_rate": 2.919123514828969e-06, "loss": 0.4454, "step": 6632 }, { "epoch": 0.76, "learning_rate": 2.916510172149799e-06, "loss": 0.4309, "step": 6633 }, { "epoch": 0.76, "learning_rate": 2.913897800066887e-06, "loss": 0.4529, "step": 6634 }, { "epoch": 0.76, "learning_rate": 2.911286398938178e-06, "loss": 0.4504, "step": 6635 }, { "epoch": 0.76, "learning_rate": 2.9086759691214994e-06, "loss": 0.4542, "step": 6636 }, { "epoch": 0.76, "learning_rate": 2.9060665109745324e-06, "loss": 0.4558, "step": 6637 }, { "epoch": 0.76, "learning_rate": 2.9034580248548363e-06, "loss": 0.458, "step": 6638 }, { "epoch": 0.76, "learning_rate": 2.900850511119826e-06, "loss": 0.4515, "step": 6639 }, { "epoch": 0.76, "learning_rate": 2.898243970126793e-06, "loss": 0.4648, "step": 6640 }, { "epoch": 0.76, "learning_rate": 2.8956384022328943e-06, "loss": 0.4455, "step": 6641 }, { "epoch": 0.76, "learning_rate": 2.893033807795147e-06, "loss": 0.4698, "step": 6642 }, { "epoch": 0.76, "learning_rate": 2.8904301871704377e-06, "loss": 0.4463, "step": 6643 }, { "epoch": 0.76, "learning_rate": 2.8878275407155244e-06, "loss": 0.4796, "step": 6644 }, { "epoch": 0.76, "learning_rate": 2.885225868787025e-06, "loss": 0.4443, "step": 6645 }, { "epoch": 0.76, "learning_rate": 2.8826251717414245e-06, "loss": 0.458, "step": 6646 }, { "epoch": 0.76, "learning_rate": 2.8800254499350797e-06, "loss": 0.4368, "step": 6647 }, { "epoch": 0.76, "learning_rate": 2.8774267037242133e-06, "loss": 0.4671, "step": 6648 }, { "epoch": 0.76, "learning_rate": 2.8748289334649036e-06, "loss": 0.4454, "step": 6649 }, { "epoch": 0.76, "learning_rate": 2.8722321395131127e-06, "loss": 0.433, "step": 6650 }, { "epoch": 0.76, "learning_rate": 2.8696363222246504e-06, "loss": 0.4398, "step": 6651 }, { "epoch": 0.76, "learning_rate": 2.8670414819552082e-06, "loss": 0.4618, "step": 6652 }, { "epoch": 0.76, "learning_rate": 2.864447619060333e-06, "loss": 0.4626, "step": 6653 }, { "epoch": 0.76, "learning_rate": 2.861854733895446e-06, "loss": 0.4605, "step": 6654 }, { "epoch": 0.76, "learning_rate": 2.8592628268158273e-06, "loss": 0.4402, "step": 6655 }, { "epoch": 0.76, "learning_rate": 2.8566718981766238e-06, "loss": 0.4339, "step": 6656 }, { "epoch": 0.76, "learning_rate": 2.854081948332854e-06, "loss": 0.4739, "step": 6657 }, { "epoch": 0.76, "learning_rate": 2.8514929776394006e-06, "loss": 0.4559, "step": 6658 }, { "epoch": 0.76, "learning_rate": 2.8489049864510053e-06, "loss": 0.4355, "step": 6659 }, { "epoch": 0.76, "learning_rate": 2.846317975122287e-06, "loss": 0.4431, "step": 6660 }, { "epoch": 0.76, "learning_rate": 2.843731944007717e-06, "loss": 0.4666, "step": 6661 }, { "epoch": 0.76, "learning_rate": 2.841146893461646e-06, "loss": 0.4639, "step": 6662 }, { "epoch": 0.76, "learning_rate": 2.8385628238382803e-06, "loss": 0.4551, "step": 6663 }, { "epoch": 0.76, "learning_rate": 2.8359797354916907e-06, "loss": 0.4547, "step": 6664 }, { "epoch": 0.76, "learning_rate": 2.833397628775827e-06, "loss": 0.4457, "step": 6665 }, { "epoch": 0.76, "learning_rate": 2.830816504044488e-06, "loss": 0.4398, "step": 6666 }, { "epoch": 0.76, "learning_rate": 2.8282363616513475e-06, "loss": 0.4445, "step": 6667 }, { "epoch": 0.76, "learning_rate": 2.8256572019499474e-06, "loss": 0.4753, "step": 6668 }, { "epoch": 0.76, "learning_rate": 2.8230790252936826e-06, "loss": 0.4523, "step": 6669 }, { "epoch": 0.76, "learning_rate": 2.8205018320358268e-06, "loss": 0.4613, "step": 6670 }, { "epoch": 0.76, "learning_rate": 2.8179256225295114e-06, "loss": 0.467, "step": 6671 }, { "epoch": 0.76, "learning_rate": 2.815350397127732e-06, "loss": 0.469, "step": 6672 }, { "epoch": 0.76, "learning_rate": 2.8127761561833554e-06, "loss": 0.4359, "step": 6673 }, { "epoch": 0.76, "learning_rate": 2.810202900049106e-06, "loss": 0.4473, "step": 6674 }, { "epoch": 0.76, "learning_rate": 2.8076306290775823e-06, "loss": 0.4625, "step": 6675 }, { "epoch": 0.76, "learning_rate": 2.8050593436212394e-06, "loss": 0.451, "step": 6676 }, { "epoch": 0.76, "learning_rate": 2.8024890440324e-06, "loss": 0.4503, "step": 6677 }, { "epoch": 0.76, "learning_rate": 2.7999197306632576e-06, "loss": 0.4582, "step": 6678 }, { "epoch": 0.76, "learning_rate": 2.79735140386586e-06, "loss": 0.4593, "step": 6679 }, { "epoch": 0.76, "learning_rate": 2.7947840639921308e-06, "loss": 0.4524, "step": 6680 }, { "epoch": 0.76, "learning_rate": 2.792217711393849e-06, "loss": 0.4527, "step": 6681 }, { "epoch": 0.76, "learning_rate": 2.78965234642266e-06, "loss": 0.452, "step": 6682 }, { "epoch": 0.76, "learning_rate": 2.7870879694300825e-06, "loss": 0.4344, "step": 6683 }, { "epoch": 0.76, "learning_rate": 2.7845245807674893e-06, "loss": 0.4756, "step": 6684 }, { "epoch": 0.76, "learning_rate": 2.7819621807861197e-06, "loss": 0.4306, "step": 6685 }, { "epoch": 0.76, "learning_rate": 2.779400769837083e-06, "loss": 0.4731, "step": 6686 }, { "epoch": 0.76, "learning_rate": 2.776840348271348e-06, "loss": 0.4586, "step": 6687 }, { "epoch": 0.76, "learning_rate": 2.7742809164397546e-06, "loss": 0.4586, "step": 6688 }, { "epoch": 0.76, "learning_rate": 2.7717224746929984e-06, "loss": 0.4355, "step": 6689 }, { "epoch": 0.76, "learning_rate": 2.769165023381639e-06, "loss": 0.453, "step": 6690 }, { "epoch": 0.76, "learning_rate": 2.7666085628561126e-06, "loss": 0.4595, "step": 6691 }, { "epoch": 0.76, "learning_rate": 2.764053093466702e-06, "loss": 0.4609, "step": 6692 }, { "epoch": 0.76, "learning_rate": 2.7614986155635737e-06, "loss": 0.4531, "step": 6693 }, { "epoch": 0.77, "learning_rate": 2.7589451294967383e-06, "loss": 0.4557, "step": 6694 }, { "epoch": 0.77, "learning_rate": 2.75639263561609e-06, "loss": 0.4522, "step": 6695 }, { "epoch": 0.77, "learning_rate": 2.753841134271368e-06, "loss": 0.468, "step": 6696 }, { "epoch": 0.77, "learning_rate": 2.7512906258121907e-06, "loss": 0.4466, "step": 6697 }, { "epoch": 0.77, "learning_rate": 2.7487411105880356e-06, "loss": 0.454, "step": 6698 }, { "epoch": 0.77, "learning_rate": 2.7461925889482422e-06, "loss": 0.4294, "step": 6699 }, { "epoch": 0.77, "learning_rate": 2.7436450612420098e-06, "loss": 0.4556, "step": 6700 }, { "epoch": 0.77, "learning_rate": 2.7410985278184144e-06, "loss": 0.4682, "step": 6701 }, { "epoch": 0.77, "learning_rate": 2.738552989026384e-06, "loss": 0.4551, "step": 6702 }, { "epoch": 0.77, "learning_rate": 2.7360084452147108e-06, "loss": 0.4589, "step": 6703 }, { "epoch": 0.77, "learning_rate": 2.7334648967320587e-06, "loss": 0.4527, "step": 6704 }, { "epoch": 0.77, "learning_rate": 2.7309223439269516e-06, "loss": 0.4516, "step": 6705 }, { "epoch": 0.77, "learning_rate": 2.728380787147772e-06, "loss": 0.4418, "step": 6706 }, { "epoch": 0.77, "learning_rate": 2.725840226742774e-06, "loss": 0.4448, "step": 6707 }, { "epoch": 0.77, "learning_rate": 2.7233006630600667e-06, "loss": 0.4588, "step": 6708 }, { "epoch": 0.77, "learning_rate": 2.7207620964476323e-06, "loss": 0.4534, "step": 6709 }, { "epoch": 0.77, "learning_rate": 2.7182245272533046e-06, "loss": 0.4508, "step": 6710 }, { "epoch": 0.77, "learning_rate": 2.715687955824795e-06, "loss": 0.4542, "step": 6711 }, { "epoch": 0.77, "learning_rate": 2.713152382509665e-06, "loss": 0.451, "step": 6712 }, { "epoch": 0.77, "learning_rate": 2.7106178076553446e-06, "loss": 0.4442, "step": 6713 }, { "epoch": 0.77, "learning_rate": 2.7080842316091273e-06, "loss": 0.4464, "step": 6714 }, { "epoch": 0.77, "learning_rate": 2.7055516547181736e-06, "loss": 0.4548, "step": 6715 }, { "epoch": 0.77, "learning_rate": 2.703020077329498e-06, "loss": 0.4454, "step": 6716 }, { "epoch": 0.77, "learning_rate": 2.7004894997899878e-06, "loss": 0.438, "step": 6717 }, { "epoch": 0.77, "learning_rate": 2.6979599224463838e-06, "loss": 0.4595, "step": 6718 }, { "epoch": 0.77, "learning_rate": 2.6954313456452995e-06, "loss": 0.4586, "step": 6719 }, { "epoch": 0.77, "learning_rate": 2.6929037697332037e-06, "loss": 0.4458, "step": 6720 }, { "epoch": 0.77, "learning_rate": 2.6903771950564294e-06, "loss": 0.4398, "step": 6721 }, { "epoch": 0.77, "learning_rate": 2.6878516219611773e-06, "loss": 0.4544, "step": 6722 }, { "epoch": 0.77, "learning_rate": 2.6853270507935013e-06, "loss": 0.4588, "step": 6723 }, { "epoch": 0.77, "learning_rate": 2.6828034818993285e-06, "loss": 0.4461, "step": 6724 }, { "epoch": 0.77, "learning_rate": 2.680280915624448e-06, "loss": 0.4515, "step": 6725 }, { "epoch": 0.77, "learning_rate": 2.6777593523144986e-06, "loss": 0.4567, "step": 6726 }, { "epoch": 0.77, "learning_rate": 2.675238792314999e-06, "loss": 0.4453, "step": 6727 }, { "epoch": 0.77, "learning_rate": 2.6727192359713196e-06, "loss": 0.4547, "step": 6728 }, { "epoch": 0.77, "learning_rate": 2.670200683628691e-06, "loss": 0.4584, "step": 6729 }, { "epoch": 0.77, "learning_rate": 2.6676831356322184e-06, "loss": 0.4569, "step": 6730 }, { "epoch": 0.77, "learning_rate": 2.6651665923268555e-06, "loss": 0.4601, "step": 6731 }, { "epoch": 0.77, "learning_rate": 2.6626510540574314e-06, "loss": 0.4423, "step": 6732 }, { "epoch": 0.77, "learning_rate": 2.6601365211686248e-06, "loss": 0.459, "step": 6733 }, { "epoch": 0.77, "learning_rate": 2.657622994004986e-06, "loss": 0.4568, "step": 6734 }, { "epoch": 0.77, "learning_rate": 2.655110472910927e-06, "loss": 0.4484, "step": 6735 }, { "epoch": 0.77, "learning_rate": 2.652598958230713e-06, "loss": 0.4592, "step": 6736 }, { "epoch": 0.77, "learning_rate": 2.6500884503084857e-06, "loss": 0.4461, "step": 6737 }, { "epoch": 0.77, "learning_rate": 2.647578949488234e-06, "loss": 0.4984, "step": 6738 }, { "epoch": 0.77, "learning_rate": 2.645070456113816e-06, "loss": 0.4566, "step": 6739 }, { "epoch": 0.77, "learning_rate": 2.6425629705289556e-06, "loss": 0.4459, "step": 6740 }, { "epoch": 0.77, "learning_rate": 2.640056493077231e-06, "loss": 0.4461, "step": 6741 }, { "epoch": 0.77, "learning_rate": 2.637551024102084e-06, "loss": 0.4478, "step": 6742 }, { "epoch": 0.77, "learning_rate": 2.6350465639468213e-06, "loss": 0.44, "step": 6743 }, { "epoch": 0.77, "learning_rate": 2.6325431129546107e-06, "loss": 0.4568, "step": 6744 }, { "epoch": 0.77, "learning_rate": 2.6300406714684834e-06, "loss": 0.4455, "step": 6745 }, { "epoch": 0.77, "learning_rate": 2.627539239831328e-06, "loss": 0.4659, "step": 6746 }, { "epoch": 0.77, "learning_rate": 2.625038818385892e-06, "loss": 0.4441, "step": 6747 }, { "epoch": 0.77, "learning_rate": 2.6225394074747956e-06, "loss": 0.4484, "step": 6748 }, { "epoch": 0.77, "learning_rate": 2.620041007440508e-06, "loss": 0.4494, "step": 6749 }, { "epoch": 0.77, "learning_rate": 2.617543618625371e-06, "loss": 0.4613, "step": 6750 }, { "epoch": 0.77, "learning_rate": 2.615047241371581e-06, "loss": 0.4473, "step": 6751 }, { "epoch": 0.77, "learning_rate": 2.6125518760211933e-06, "loss": 0.459, "step": 6752 }, { "epoch": 0.77, "learning_rate": 2.610057522916132e-06, "loss": 0.456, "step": 6753 }, { "epoch": 0.77, "learning_rate": 2.6075641823981814e-06, "loss": 0.4547, "step": 6754 }, { "epoch": 0.77, "learning_rate": 2.6050718548089804e-06, "loss": 0.4559, "step": 6755 }, { "epoch": 0.77, "learning_rate": 2.602580540490038e-06, "loss": 0.463, "step": 6756 }, { "epoch": 0.77, "learning_rate": 2.6000902397827154e-06, "loss": 0.4474, "step": 6757 }, { "epoch": 0.77, "learning_rate": 2.5976009530282455e-06, "loss": 0.4649, "step": 6758 }, { "epoch": 0.77, "learning_rate": 2.595112680567711e-06, "loss": 0.4483, "step": 6759 }, { "epoch": 0.77, "learning_rate": 2.592625422742059e-06, "loss": 0.4602, "step": 6760 }, { "epoch": 0.77, "learning_rate": 2.5901391798921018e-06, "loss": 0.4647, "step": 6761 }, { "epoch": 0.77, "learning_rate": 2.5876539523585144e-06, "loss": 0.4619, "step": 6762 }, { "epoch": 0.77, "learning_rate": 2.585169740481822e-06, "loss": 0.4544, "step": 6763 }, { "epoch": 0.77, "learning_rate": 2.582686544602423e-06, "loss": 0.4573, "step": 6764 }, { "epoch": 0.77, "learning_rate": 2.5802043650605645e-06, "loss": 0.4429, "step": 6765 }, { "epoch": 0.77, "learning_rate": 2.577723202196366e-06, "loss": 0.4496, "step": 6766 }, { "epoch": 0.77, "learning_rate": 2.575243056349801e-06, "loss": 0.4589, "step": 6767 }, { "epoch": 0.77, "learning_rate": 2.5727639278606997e-06, "loss": 0.4451, "step": 6768 }, { "epoch": 0.77, "learning_rate": 2.570285817068765e-06, "loss": 0.4611, "step": 6769 }, { "epoch": 0.77, "learning_rate": 2.5678087243135476e-06, "loss": 0.4572, "step": 6770 }, { "epoch": 0.77, "learning_rate": 2.565332649934468e-06, "loss": 0.4633, "step": 6771 }, { "epoch": 0.77, "learning_rate": 2.5628575942708047e-06, "loss": 0.4609, "step": 6772 }, { "epoch": 0.77, "learning_rate": 2.560383557661692e-06, "loss": 0.454, "step": 6773 }, { "epoch": 0.77, "learning_rate": 2.5579105404461325e-06, "loss": 0.4556, "step": 6774 }, { "epoch": 0.77, "learning_rate": 2.555438542962979e-06, "loss": 0.4432, "step": 6775 }, { "epoch": 0.77, "learning_rate": 2.5529675655509567e-06, "loss": 0.4549, "step": 6776 }, { "epoch": 0.77, "learning_rate": 2.550497608548642e-06, "loss": 0.4414, "step": 6777 }, { "epoch": 0.77, "learning_rate": 2.5480286722944712e-06, "loss": 0.4531, "step": 6778 }, { "epoch": 0.77, "learning_rate": 2.5455607571267484e-06, "loss": 0.4699, "step": 6779 }, { "epoch": 0.77, "learning_rate": 2.543093863383629e-06, "loss": 0.4576, "step": 6780 }, { "epoch": 0.77, "learning_rate": 2.540627991403134e-06, "loss": 0.4535, "step": 6781 }, { "epoch": 0.78, "learning_rate": 2.5381631415231455e-06, "loss": 0.479, "step": 6782 }, { "epoch": 0.78, "learning_rate": 2.535699314081399e-06, "loss": 0.4589, "step": 6783 }, { "epoch": 0.78, "learning_rate": 2.5332365094154975e-06, "loss": 0.4563, "step": 6784 }, { "epoch": 0.78, "learning_rate": 2.530774727862899e-06, "loss": 0.4539, "step": 6785 }, { "epoch": 0.78, "learning_rate": 2.5283139697609195e-06, "loss": 0.4446, "step": 6786 }, { "epoch": 0.78, "learning_rate": 2.525854235446743e-06, "loss": 0.4636, "step": 6787 }, { "epoch": 0.78, "learning_rate": 2.5233955252574027e-06, "loss": 0.4485, "step": 6788 }, { "epoch": 0.78, "learning_rate": 2.5209378395298013e-06, "loss": 0.4408, "step": 6789 }, { "epoch": 0.78, "learning_rate": 2.5184811786006923e-06, "loss": 0.4678, "step": 6790 }, { "epoch": 0.78, "learning_rate": 2.516025542806696e-06, "loss": 0.4418, "step": 6791 }, { "epoch": 0.78, "learning_rate": 2.5135709324842906e-06, "loss": 0.4579, "step": 6792 }, { "epoch": 0.78, "learning_rate": 2.511117347969809e-06, "loss": 0.453, "step": 6793 }, { "epoch": 0.78, "learning_rate": 2.508664789599451e-06, "loss": 0.4449, "step": 6794 }, { "epoch": 0.78, "learning_rate": 2.50621325770927e-06, "loss": 0.4601, "step": 6795 }, { "epoch": 0.78, "learning_rate": 2.503762752635177e-06, "loss": 0.4701, "step": 6796 }, { "epoch": 0.78, "learning_rate": 2.501313274712952e-06, "loss": 0.4432, "step": 6797 }, { "epoch": 0.78, "learning_rate": 2.4988648242782255e-06, "loss": 0.4596, "step": 6798 }, { "epoch": 0.78, "learning_rate": 2.4964174016664865e-06, "loss": 0.4429, "step": 6799 }, { "epoch": 0.78, "learning_rate": 2.4939710072130895e-06, "loss": 0.4535, "step": 6800 }, { "epoch": 0.78, "learning_rate": 2.4915256412532463e-06, "loss": 0.4357, "step": 6801 }, { "epoch": 0.78, "learning_rate": 2.4890813041220286e-06, "loss": 0.4536, "step": 6802 }, { "epoch": 0.78, "learning_rate": 2.486637996154362e-06, "loss": 0.442, "step": 6803 }, { "epoch": 0.78, "learning_rate": 2.4841957176850306e-06, "loss": 0.4543, "step": 6804 }, { "epoch": 0.78, "learning_rate": 2.4817544690486896e-06, "loss": 0.4535, "step": 6805 }, { "epoch": 0.78, "learning_rate": 2.4793142505798363e-06, "loss": 0.4411, "step": 6806 }, { "epoch": 0.78, "learning_rate": 2.4768750626128414e-06, "loss": 0.4497, "step": 6807 }, { "epoch": 0.78, "learning_rate": 2.4744369054819252e-06, "loss": 0.4533, "step": 6808 }, { "epoch": 0.78, "learning_rate": 2.4719997795211683e-06, "loss": 0.4417, "step": 6809 }, { "epoch": 0.78, "learning_rate": 2.4695636850645112e-06, "loss": 0.4485, "step": 6810 }, { "epoch": 0.78, "learning_rate": 2.467128622445759e-06, "loss": 0.4413, "step": 6811 }, { "epoch": 0.78, "learning_rate": 2.464694591998563e-06, "loss": 0.4554, "step": 6812 }, { "epoch": 0.78, "learning_rate": 2.4622615940564454e-06, "loss": 0.4551, "step": 6813 }, { "epoch": 0.78, "learning_rate": 2.4598296289527745e-06, "loss": 0.4501, "step": 6814 }, { "epoch": 0.78, "learning_rate": 2.4573986970207906e-06, "loss": 0.4521, "step": 6815 }, { "epoch": 0.78, "learning_rate": 2.4549687985935832e-06, "loss": 0.4545, "step": 6816 }, { "epoch": 0.78, "learning_rate": 2.452539934004099e-06, "loss": 0.436, "step": 6817 }, { "epoch": 0.78, "learning_rate": 2.4501121035851494e-06, "loss": 0.4512, "step": 6818 }, { "epoch": 0.78, "learning_rate": 2.447685307669405e-06, "loss": 0.4505, "step": 6819 }, { "epoch": 0.78, "learning_rate": 2.4452595465893847e-06, "loss": 0.4493, "step": 6820 }, { "epoch": 0.78, "learning_rate": 2.4428348206774775e-06, "loss": 0.4526, "step": 6821 }, { "epoch": 0.78, "learning_rate": 2.4404111302659195e-06, "loss": 0.4747, "step": 6822 }, { "epoch": 0.78, "learning_rate": 2.4379884756868167e-06, "loss": 0.4277, "step": 6823 }, { "epoch": 0.78, "learning_rate": 2.4355668572721224e-06, "loss": 0.4578, "step": 6824 }, { "epoch": 0.78, "learning_rate": 2.433146275353652e-06, "loss": 0.4408, "step": 6825 }, { "epoch": 0.78, "learning_rate": 2.4307267302630834e-06, "loss": 0.4679, "step": 6826 }, { "epoch": 0.78, "learning_rate": 2.428308222331942e-06, "loss": 0.4573, "step": 6827 }, { "epoch": 0.78, "learning_rate": 2.4258907518916207e-06, "loss": 0.4575, "step": 6828 }, { "epoch": 0.78, "learning_rate": 2.4234743192733713e-06, "loss": 0.4426, "step": 6829 }, { "epoch": 0.78, "learning_rate": 2.4210589248082914e-06, "loss": 0.4606, "step": 6830 }, { "epoch": 0.78, "learning_rate": 2.4186445688273508e-06, "loss": 0.4585, "step": 6831 }, { "epoch": 0.78, "learning_rate": 2.416231251661364e-06, "loss": 0.4363, "step": 6832 }, { "epoch": 0.78, "learning_rate": 2.4138189736410144e-06, "loss": 0.4513, "step": 6833 }, { "epoch": 0.78, "learning_rate": 2.411407735096836e-06, "loss": 0.4403, "step": 6834 }, { "epoch": 0.78, "learning_rate": 2.40899753635922e-06, "loss": 0.435, "step": 6835 }, { "epoch": 0.78, "learning_rate": 2.406588377758421e-06, "loss": 0.4783, "step": 6836 }, { "epoch": 0.78, "learning_rate": 2.4041802596245444e-06, "loss": 0.4533, "step": 6837 }, { "epoch": 0.78, "learning_rate": 2.4017731822875566e-06, "loss": 0.4545, "step": 6838 }, { "epoch": 0.78, "learning_rate": 2.399367146077286e-06, "loss": 0.4624, "step": 6839 }, { "epoch": 0.78, "learning_rate": 2.3969621513234066e-06, "loss": 0.46, "step": 6840 }, { "epoch": 0.78, "learning_rate": 2.394558198355462e-06, "loss": 0.4667, "step": 6841 }, { "epoch": 0.78, "learning_rate": 2.3921552875028443e-06, "loss": 0.4611, "step": 6842 }, { "epoch": 0.78, "learning_rate": 2.3897534190948034e-06, "loss": 0.4417, "step": 6843 }, { "epoch": 0.78, "learning_rate": 2.387352593460455e-06, "loss": 0.4708, "step": 6844 }, { "epoch": 0.78, "learning_rate": 2.384952810928759e-06, "loss": 0.456, "step": 6845 }, { "epoch": 0.78, "learning_rate": 2.3825540718285454e-06, "loss": 0.4431, "step": 6846 }, { "epoch": 0.78, "learning_rate": 2.3801563764884905e-06, "loss": 0.4557, "step": 6847 }, { "epoch": 0.78, "learning_rate": 2.377759725237133e-06, "loss": 0.4571, "step": 6848 }, { "epoch": 0.78, "learning_rate": 2.375364118402872e-06, "loss": 0.4388, "step": 6849 }, { "epoch": 0.78, "learning_rate": 2.3729695563139554e-06, "loss": 0.4392, "step": 6850 }, { "epoch": 0.78, "learning_rate": 2.3705760392984887e-06, "loss": 0.4436, "step": 6851 }, { "epoch": 0.78, "learning_rate": 2.3681835676844444e-06, "loss": 0.4396, "step": 6852 }, { "epoch": 0.78, "learning_rate": 2.3657921417996364e-06, "loss": 0.4496, "step": 6853 }, { "epoch": 0.78, "learning_rate": 2.363401761971752e-06, "loss": 0.4712, "step": 6854 }, { "epoch": 0.78, "learning_rate": 2.361012428528321e-06, "loss": 0.4381, "step": 6855 }, { "epoch": 0.78, "learning_rate": 2.3586241417967336e-06, "loss": 0.4399, "step": 6856 }, { "epoch": 0.78, "learning_rate": 2.356236902104242e-06, "loss": 0.4752, "step": 6857 }, { "epoch": 0.78, "learning_rate": 2.3538507097779505e-06, "loss": 0.4426, "step": 6858 }, { "epoch": 0.78, "learning_rate": 2.351465565144825e-06, "loss": 0.4458, "step": 6859 }, { "epoch": 0.78, "learning_rate": 2.3490814685316777e-06, "loss": 0.4235, "step": 6860 }, { "epoch": 0.78, "learning_rate": 2.3466984202651833e-06, "loss": 0.4463, "step": 6861 }, { "epoch": 0.78, "learning_rate": 2.344316420671876e-06, "loss": 0.4494, "step": 6862 }, { "epoch": 0.78, "learning_rate": 2.3419354700781393e-06, "loss": 0.4436, "step": 6863 }, { "epoch": 0.78, "learning_rate": 2.339555568810221e-06, "loss": 0.4534, "step": 6864 }, { "epoch": 0.78, "learning_rate": 2.3371767171942183e-06, "loss": 0.4484, "step": 6865 }, { "epoch": 0.78, "learning_rate": 2.3347989155560835e-06, "loss": 0.4561, "step": 6866 }, { "epoch": 0.78, "learning_rate": 2.3324221642216328e-06, "loss": 0.457, "step": 6867 }, { "epoch": 0.78, "learning_rate": 2.3300464635165353e-06, "loss": 0.4517, "step": 6868 }, { "epoch": 0.79, "learning_rate": 2.32767181376631e-06, "loss": 0.4567, "step": 6869 }, { "epoch": 0.79, "learning_rate": 2.3252982152963434e-06, "loss": 0.4546, "step": 6870 }, { "epoch": 0.79, "learning_rate": 2.3229256684318646e-06, "loss": 0.4425, "step": 6871 }, { "epoch": 0.79, "learning_rate": 2.320554173497972e-06, "loss": 0.4547, "step": 6872 }, { "epoch": 0.79, "learning_rate": 2.31818373081961e-06, "loss": 0.4633, "step": 6873 }, { "epoch": 0.79, "learning_rate": 2.3158143407215796e-06, "loss": 0.4514, "step": 6874 }, { "epoch": 0.79, "learning_rate": 2.3134460035285433e-06, "loss": 0.4556, "step": 6875 }, { "epoch": 0.79, "learning_rate": 2.3110787195650173e-06, "loss": 0.4472, "step": 6876 }, { "epoch": 0.79, "learning_rate": 2.3087124891553703e-06, "loss": 0.4514, "step": 6877 }, { "epoch": 0.79, "learning_rate": 2.30634731262383e-06, "loss": 0.4429, "step": 6878 }, { "epoch": 0.79, "learning_rate": 2.3039831902944766e-06, "loss": 0.4412, "step": 6879 }, { "epoch": 0.79, "learning_rate": 2.3016201224912504e-06, "loss": 0.4455, "step": 6880 }, { "epoch": 0.79, "learning_rate": 2.299258109537943e-06, "loss": 0.4689, "step": 6881 }, { "epoch": 0.79, "learning_rate": 2.2968971517581994e-06, "loss": 0.4426, "step": 6882 }, { "epoch": 0.79, "learning_rate": 2.2945372494755304e-06, "loss": 0.4538, "step": 6883 }, { "epoch": 0.79, "learning_rate": 2.2921784030132886e-06, "loss": 0.4454, "step": 6884 }, { "epoch": 0.79, "learning_rate": 2.289820612694692e-06, "loss": 0.4694, "step": 6885 }, { "epoch": 0.79, "learning_rate": 2.2874638788428128e-06, "loss": 0.4444, "step": 6886 }, { "epoch": 0.79, "learning_rate": 2.2851082017805704e-06, "loss": 0.4471, "step": 6887 }, { "epoch": 0.79, "learning_rate": 2.2827535818307513e-06, "loss": 0.4536, "step": 6888 }, { "epoch": 0.79, "learning_rate": 2.2804000193159848e-06, "loss": 0.453, "step": 6889 }, { "epoch": 0.79, "learning_rate": 2.278047514558769e-06, "loss": 0.47, "step": 6890 }, { "epoch": 0.79, "learning_rate": 2.2756960678814444e-06, "loss": 0.4648, "step": 6891 }, { "epoch": 0.79, "learning_rate": 2.2733456796062093e-06, "loss": 0.4424, "step": 6892 }, { "epoch": 0.79, "learning_rate": 2.270996350055126e-06, "loss": 0.4472, "step": 6893 }, { "epoch": 0.79, "learning_rate": 2.2686480795500986e-06, "loss": 0.4621, "step": 6894 }, { "epoch": 0.79, "learning_rate": 2.2663008684128964e-06, "loss": 0.4299, "step": 6895 }, { "epoch": 0.79, "learning_rate": 2.2639547169651423e-06, "loss": 0.453, "step": 6896 }, { "epoch": 0.79, "learning_rate": 2.2616096255283048e-06, "loss": 0.4602, "step": 6897 }, { "epoch": 0.79, "learning_rate": 2.25926559442372e-06, "loss": 0.447, "step": 6898 }, { "epoch": 0.79, "learning_rate": 2.2569226239725695e-06, "loss": 0.4674, "step": 6899 }, { "epoch": 0.79, "learning_rate": 2.2545807144958896e-06, "loss": 0.4247, "step": 6900 }, { "epoch": 0.79, "learning_rate": 2.252239866314582e-06, "loss": 0.4581, "step": 6901 }, { "epoch": 0.79, "learning_rate": 2.249900079749385e-06, "loss": 0.4323, "step": 6902 }, { "epoch": 0.79, "learning_rate": 2.247561355120912e-06, "loss": 0.442, "step": 6903 }, { "epoch": 0.79, "learning_rate": 2.245223692749612e-06, "loss": 0.4487, "step": 6904 }, { "epoch": 0.79, "learning_rate": 2.2428870929558012e-06, "loss": 0.4701, "step": 6905 }, { "epoch": 0.79, "learning_rate": 2.240551556059647e-06, "loss": 0.4617, "step": 6906 }, { "epoch": 0.79, "learning_rate": 2.238217082381169e-06, "loss": 0.4767, "step": 6907 }, { "epoch": 0.79, "learning_rate": 2.235883672240239e-06, "loss": 0.45, "step": 6908 }, { "epoch": 0.79, "learning_rate": 2.233551325956591e-06, "loss": 0.4683, "step": 6909 }, { "epoch": 0.79, "learning_rate": 2.2312200438498043e-06, "loss": 0.4498, "step": 6910 }, { "epoch": 0.79, "learning_rate": 2.2288898262393212e-06, "loss": 0.452, "step": 6911 }, { "epoch": 0.79, "learning_rate": 2.2265606734444314e-06, "loss": 0.4564, "step": 6912 }, { "epoch": 0.79, "learning_rate": 2.2242325857842773e-06, "loss": 0.4566, "step": 6913 }, { "epoch": 0.79, "learning_rate": 2.2219055635778618e-06, "loss": 0.4514, "step": 6914 }, { "epoch": 0.79, "learning_rate": 2.219579607144039e-06, "loss": 0.4527, "step": 6915 }, { "epoch": 0.79, "learning_rate": 2.21725471680152e-06, "loss": 0.4504, "step": 6916 }, { "epoch": 0.79, "learning_rate": 2.214930892868864e-06, "loss": 0.4526, "step": 6917 }, { "epoch": 0.79, "learning_rate": 2.2126081356644836e-06, "loss": 0.4445, "step": 6918 }, { "epoch": 0.79, "learning_rate": 2.210286445506654e-06, "loss": 0.4556, "step": 6919 }, { "epoch": 0.79, "learning_rate": 2.207965822713496e-06, "loss": 0.4578, "step": 6920 }, { "epoch": 0.79, "learning_rate": 2.205646267602983e-06, "loss": 0.4627, "step": 6921 }, { "epoch": 0.79, "learning_rate": 2.203327780492953e-06, "loss": 0.454, "step": 6922 }, { "epoch": 0.79, "learning_rate": 2.2010103617010836e-06, "loss": 0.4572, "step": 6923 }, { "epoch": 0.79, "learning_rate": 2.1986940115449173e-06, "loss": 0.4375, "step": 6924 }, { "epoch": 0.79, "learning_rate": 2.196378730341846e-06, "loss": 0.4548, "step": 6925 }, { "epoch": 0.79, "learning_rate": 2.1940645184091115e-06, "loss": 0.4455, "step": 6926 }, { "epoch": 0.79, "learning_rate": 2.1917513760638177e-06, "loss": 0.4483, "step": 6927 }, { "epoch": 0.79, "learning_rate": 2.18943930362291e-06, "loss": 0.4536, "step": 6928 }, { "epoch": 0.79, "learning_rate": 2.1871283014032007e-06, "loss": 0.4454, "step": 6929 }, { "epoch": 0.79, "learning_rate": 2.1848183697213467e-06, "loss": 0.4693, "step": 6930 }, { "epoch": 0.79, "learning_rate": 2.1825095088938553e-06, "loss": 0.4515, "step": 6931 }, { "epoch": 0.79, "learning_rate": 2.1802017192370963e-06, "loss": 0.451, "step": 6932 }, { "epoch": 0.79, "learning_rate": 2.1778950010672895e-06, "loss": 0.4543, "step": 6933 }, { "epoch": 0.79, "learning_rate": 2.1755893547005036e-06, "loss": 0.4561, "step": 6934 }, { "epoch": 0.79, "learning_rate": 2.173284780452667e-06, "loss": 0.4421, "step": 6935 }, { "epoch": 0.79, "learning_rate": 2.1709812786395545e-06, "loss": 0.4498, "step": 6936 }, { "epoch": 0.79, "learning_rate": 2.1686788495768006e-06, "loss": 0.4632, "step": 6937 }, { "epoch": 0.79, "learning_rate": 2.1663774935798886e-06, "loss": 0.4392, "step": 6938 }, { "epoch": 0.79, "learning_rate": 2.1640772109641504e-06, "loss": 0.4639, "step": 6939 }, { "epoch": 0.79, "learning_rate": 2.1617780020447854e-06, "loss": 0.4477, "step": 6940 }, { "epoch": 0.79, "learning_rate": 2.1594798671368265e-06, "loss": 0.4378, "step": 6941 }, { "epoch": 0.79, "learning_rate": 2.157182806555177e-06, "loss": 0.4584, "step": 6942 }, { "epoch": 0.79, "learning_rate": 2.1548868206145846e-06, "loss": 0.4768, "step": 6943 }, { "epoch": 0.79, "learning_rate": 2.1525919096296455e-06, "loss": 0.4334, "step": 6944 }, { "epoch": 0.79, "learning_rate": 2.1502980739148215e-06, "loss": 0.4477, "step": 6945 }, { "epoch": 0.79, "learning_rate": 2.1480053137844115e-06, "loss": 0.4488, "step": 6946 }, { "epoch": 0.79, "learning_rate": 2.1457136295525817e-06, "loss": 0.4608, "step": 6947 }, { "epoch": 0.79, "learning_rate": 2.1434230215333407e-06, "loss": 0.4605, "step": 6948 }, { "epoch": 0.79, "learning_rate": 2.14113349004055e-06, "loss": 0.4562, "step": 6949 }, { "epoch": 0.79, "learning_rate": 2.138845035387932e-06, "loss": 0.4482, "step": 6950 }, { "epoch": 0.79, "learning_rate": 2.1365576578890513e-06, "loss": 0.4535, "step": 6951 }, { "epoch": 0.79, "learning_rate": 2.1342713578573327e-06, "loss": 0.44, "step": 6952 }, { "epoch": 0.79, "learning_rate": 2.131986135606051e-06, "loss": 0.447, "step": 6953 }, { "epoch": 0.79, "learning_rate": 2.1297019914483297e-06, "loss": 0.4267, "step": 6954 }, { "epoch": 0.79, "learning_rate": 2.1274189256971523e-06, "loss": 0.442, "step": 6955 }, { "epoch": 0.79, "learning_rate": 2.1251369386653454e-06, "loss": 0.4605, "step": 6956 }, { "epoch": 0.8, "learning_rate": 2.122856030665591e-06, "loss": 0.4559, "step": 6957 }, { "epoch": 0.8, "learning_rate": 2.1205762020104303e-06, "loss": 0.4631, "step": 6958 }, { "epoch": 0.8, "learning_rate": 2.1182974530122435e-06, "loss": 0.4636, "step": 6959 }, { "epoch": 0.8, "learning_rate": 2.1160197839832774e-06, "loss": 0.4414, "step": 6960 }, { "epoch": 0.8, "learning_rate": 2.113743195235617e-06, "loss": 0.4593, "step": 6961 }, { "epoch": 0.8, "learning_rate": 2.111467687081209e-06, "loss": 0.4448, "step": 6962 }, { "epoch": 0.8, "learning_rate": 2.109193259831851e-06, "loss": 0.4518, "step": 6963 }, { "epoch": 0.8, "learning_rate": 2.106919913799188e-06, "loss": 0.4534, "step": 6964 }, { "epoch": 0.8, "learning_rate": 2.1046476492947155e-06, "loss": 0.4483, "step": 6965 }, { "epoch": 0.8, "learning_rate": 2.102376466629792e-06, "loss": 0.4542, "step": 6966 }, { "epoch": 0.8, "learning_rate": 2.100106366115613e-06, "loss": 0.4583, "step": 6967 }, { "epoch": 0.8, "learning_rate": 2.0978373480632386e-06, "loss": 0.4349, "step": 6968 }, { "epoch": 0.8, "learning_rate": 2.0955694127835736e-06, "loss": 0.447, "step": 6969 }, { "epoch": 0.8, "learning_rate": 2.0933025605873702e-06, "loss": 0.4611, "step": 6970 }, { "epoch": 0.8, "learning_rate": 2.0910367917852437e-06, "loss": 0.4435, "step": 6971 }, { "epoch": 0.8, "learning_rate": 2.088772106687653e-06, "loss": 0.4551, "step": 6972 }, { "epoch": 0.8, "learning_rate": 2.0865085056049138e-06, "loss": 0.4698, "step": 6973 }, { "epoch": 0.8, "learning_rate": 2.084245988847188e-06, "loss": 0.4405, "step": 6974 }, { "epoch": 0.8, "learning_rate": 2.0819845567244868e-06, "loss": 0.4661, "step": 6975 }, { "epoch": 0.8, "learning_rate": 2.079724209546683e-06, "loss": 0.4539, "step": 6976 }, { "epoch": 0.8, "learning_rate": 2.077464947623492e-06, "loss": 0.4373, "step": 6977 }, { "epoch": 0.8, "learning_rate": 2.0752067712644807e-06, "loss": 0.4411, "step": 6978 }, { "epoch": 0.8, "learning_rate": 2.0729496807790737e-06, "loss": 0.4557, "step": 6979 }, { "epoch": 0.8, "learning_rate": 2.0706936764765393e-06, "loss": 0.4516, "step": 6980 }, { "epoch": 0.8, "learning_rate": 2.0684387586660027e-06, "loss": 0.4538, "step": 6981 }, { "epoch": 0.8, "learning_rate": 2.0661849276564394e-06, "loss": 0.4527, "step": 6982 }, { "epoch": 0.8, "learning_rate": 2.0639321837566696e-06, "loss": 0.4482, "step": 6983 }, { "epoch": 0.8, "learning_rate": 2.0616805272753758e-06, "loss": 0.4652, "step": 6984 }, { "epoch": 0.8, "learning_rate": 2.0594299585210796e-06, "loss": 0.4302, "step": 6985 }, { "epoch": 0.8, "learning_rate": 2.057180477802164e-06, "loss": 0.4535, "step": 6986 }, { "epoch": 0.8, "learning_rate": 2.054932085426856e-06, "loss": 0.4474, "step": 6987 }, { "epoch": 0.8, "learning_rate": 2.0526847817032326e-06, "loss": 0.4389, "step": 6988 }, { "epoch": 0.8, "learning_rate": 2.0504385669392268e-06, "loss": 0.4523, "step": 6989 }, { "epoch": 0.8, "learning_rate": 2.048193441442623e-06, "loss": 0.4341, "step": 6990 }, { "epoch": 0.8, "learning_rate": 2.0459494055210495e-06, "loss": 0.462, "step": 6991 }, { "epoch": 0.8, "learning_rate": 2.043706459481992e-06, "loss": 0.4544, "step": 6992 }, { "epoch": 0.8, "learning_rate": 2.0414646036327813e-06, "loss": 0.4574, "step": 6993 }, { "epoch": 0.8, "learning_rate": 2.039223838280606e-06, "loss": 0.4469, "step": 6994 }, { "epoch": 0.8, "learning_rate": 2.0369841637324992e-06, "loss": 0.4479, "step": 6995 }, { "epoch": 0.8, "learning_rate": 2.034745580295342e-06, "loss": 0.4353, "step": 6996 }, { "epoch": 0.8, "learning_rate": 2.0325080882758775e-06, "loss": 0.4502, "step": 6997 }, { "epoch": 0.8, "learning_rate": 2.030271687980685e-06, "loss": 0.4471, "step": 6998 }, { "epoch": 0.8, "learning_rate": 2.028036379716205e-06, "loss": 0.457, "step": 6999 }, { "epoch": 0.8, "learning_rate": 2.025802163788727e-06, "loss": 0.4307, "step": 7000 }, { "epoch": 0.8, "learning_rate": 2.023569040504384e-06, "loss": 0.4597, "step": 7001 }, { "epoch": 0.8, "learning_rate": 2.0213370101691675e-06, "loss": 0.4454, "step": 7002 }, { "epoch": 0.8, "learning_rate": 2.0191060730889132e-06, "loss": 0.44, "step": 7003 }, { "epoch": 0.8, "learning_rate": 2.016876229569308e-06, "loss": 0.4463, "step": 7004 }, { "epoch": 0.8, "learning_rate": 2.0146474799158935e-06, "loss": 0.4651, "step": 7005 }, { "epoch": 0.8, "learning_rate": 2.0124198244340543e-06, "loss": 0.4465, "step": 7006 }, { "epoch": 0.8, "learning_rate": 2.0101932634290345e-06, "loss": 0.4694, "step": 7007 }, { "epoch": 0.8, "learning_rate": 2.0079677972059163e-06, "loss": 0.4513, "step": 7008 }, { "epoch": 0.8, "learning_rate": 2.005743426069641e-06, "loss": 0.4398, "step": 7009 }, { "epoch": 0.8, "learning_rate": 2.003520150325e-06, "loss": 0.4537, "step": 7010 }, { "epoch": 0.8, "learning_rate": 2.0012979702766277e-06, "loss": 0.4491, "step": 7011 }, { "epoch": 0.8, "learning_rate": 1.9990768862290155e-06, "loss": 0.4225, "step": 7012 }, { "epoch": 0.8, "learning_rate": 1.9968568984865e-06, "loss": 0.4786, "step": 7013 }, { "epoch": 0.8, "learning_rate": 1.9946380073532668e-06, "loss": 0.4358, "step": 7014 }, { "epoch": 0.8, "learning_rate": 1.992420213133357e-06, "loss": 0.4804, "step": 7015 }, { "epoch": 0.8, "learning_rate": 1.9902035161306574e-06, "loss": 0.4417, "step": 7016 }, { "epoch": 0.8, "learning_rate": 1.9879879166489023e-06, "loss": 0.4523, "step": 7017 }, { "epoch": 0.8, "learning_rate": 1.9857734149916787e-06, "loss": 0.4359, "step": 7018 }, { "epoch": 0.8, "learning_rate": 1.983560011462425e-06, "loss": 0.4723, "step": 7019 }, { "epoch": 0.8, "learning_rate": 1.981347706364429e-06, "loss": 0.441, "step": 7020 }, { "epoch": 0.8, "learning_rate": 1.979136500000822e-06, "loss": 0.4501, "step": 7021 }, { "epoch": 0.8, "learning_rate": 1.9769263926745886e-06, "loss": 0.4283, "step": 7022 }, { "epoch": 0.8, "learning_rate": 1.974717384688566e-06, "loss": 0.4435, "step": 7023 }, { "epoch": 0.8, "learning_rate": 1.972509476345432e-06, "loss": 0.4534, "step": 7024 }, { "epoch": 0.8, "learning_rate": 1.9703026679477253e-06, "loss": 0.4595, "step": 7025 }, { "epoch": 0.8, "learning_rate": 1.968096959797827e-06, "loss": 0.4401, "step": 7026 }, { "epoch": 0.8, "learning_rate": 1.9658923521979633e-06, "loss": 0.4562, "step": 7027 }, { "epoch": 0.8, "learning_rate": 1.963688845450218e-06, "loss": 0.4607, "step": 7028 }, { "epoch": 0.8, "learning_rate": 1.9614864398565212e-06, "loss": 0.4341, "step": 7029 }, { "epoch": 0.8, "learning_rate": 1.9592851357186537e-06, "loss": 0.4564, "step": 7030 }, { "epoch": 0.8, "learning_rate": 1.957084933338241e-06, "loss": 0.4644, "step": 7031 }, { "epoch": 0.8, "learning_rate": 1.9548858330167584e-06, "loss": 0.4615, "step": 7032 }, { "epoch": 0.8, "learning_rate": 1.9526878350555344e-06, "loss": 0.4764, "step": 7033 }, { "epoch": 0.8, "learning_rate": 1.9504909397557436e-06, "loss": 0.4278, "step": 7034 }, { "epoch": 0.8, "learning_rate": 1.9482951474184054e-06, "loss": 0.4495, "step": 7035 }, { "epoch": 0.8, "learning_rate": 1.9461004583443986e-06, "loss": 0.447, "step": 7036 }, { "epoch": 0.8, "learning_rate": 1.94390687283444e-06, "loss": 0.4558, "step": 7037 }, { "epoch": 0.8, "learning_rate": 1.9417143911891003e-06, "loss": 0.4436, "step": 7038 }, { "epoch": 0.8, "learning_rate": 1.939523013708803e-06, "loss": 0.4531, "step": 7039 }, { "epoch": 0.8, "learning_rate": 1.937332740693809e-06, "loss": 0.4468, "step": 7040 }, { "epoch": 0.8, "learning_rate": 1.9351435724442412e-06, "loss": 0.4673, "step": 7041 }, { "epoch": 0.8, "learning_rate": 1.9329555092600593e-06, "loss": 0.4542, "step": 7042 }, { "epoch": 0.8, "learning_rate": 1.9307685514410803e-06, "loss": 0.4458, "step": 7043 }, { "epoch": 0.81, "learning_rate": 1.928582699286965e-06, "loss": 0.4467, "step": 7044 }, { "epoch": 0.81, "learning_rate": 1.926397953097222e-06, "loss": 0.4474, "step": 7045 }, { "epoch": 0.81, "learning_rate": 1.924214313171211e-06, "loss": 0.4305, "step": 7046 }, { "epoch": 0.81, "learning_rate": 1.9220317798081433e-06, "loss": 0.456, "step": 7047 }, { "epoch": 0.81, "learning_rate": 1.9198503533070688e-06, "loss": 0.467, "step": 7048 }, { "epoch": 0.81, "learning_rate": 1.9176700339668986e-06, "loss": 0.4586, "step": 7049 }, { "epoch": 0.81, "learning_rate": 1.9154908220863775e-06, "loss": 0.447, "step": 7050 }, { "epoch": 0.81, "learning_rate": 1.913312717964113e-06, "loss": 0.4616, "step": 7051 }, { "epoch": 0.81, "learning_rate": 1.9111357218985504e-06, "loss": 0.4483, "step": 7052 }, { "epoch": 0.81, "learning_rate": 1.9089598341879855e-06, "loss": 0.4495, "step": 7053 }, { "epoch": 0.81, "learning_rate": 1.9067850551305678e-06, "loss": 0.4501, "step": 7054 }, { "epoch": 0.81, "learning_rate": 1.9046113850242843e-06, "loss": 0.4501, "step": 7055 }, { "epoch": 0.81, "learning_rate": 1.9024388241669811e-06, "loss": 0.4504, "step": 7056 }, { "epoch": 0.81, "learning_rate": 1.900267372856348e-06, "loss": 0.4638, "step": 7057 }, { "epoch": 0.81, "learning_rate": 1.8980970313899193e-06, "loss": 0.4497, "step": 7058 }, { "epoch": 0.81, "learning_rate": 1.8959278000650839e-06, "loss": 0.449, "step": 7059 }, { "epoch": 0.81, "learning_rate": 1.8937596791790735e-06, "loss": 0.45, "step": 7060 }, { "epoch": 0.81, "learning_rate": 1.8915926690289643e-06, "loss": 0.4337, "step": 7061 }, { "epoch": 0.81, "learning_rate": 1.889426769911693e-06, "loss": 0.4467, "step": 7062 }, { "epoch": 0.81, "learning_rate": 1.887261982124029e-06, "loss": 0.4389, "step": 7063 }, { "epoch": 0.81, "learning_rate": 1.8850983059626026e-06, "loss": 0.4479, "step": 7064 }, { "epoch": 0.81, "learning_rate": 1.8829357417238802e-06, "loss": 0.4554, "step": 7065 }, { "epoch": 0.81, "learning_rate": 1.8807742897041847e-06, "loss": 0.4657, "step": 7066 }, { "epoch": 0.81, "learning_rate": 1.8786139501996847e-06, "loss": 0.4486, "step": 7067 }, { "epoch": 0.81, "learning_rate": 1.8764547235063912e-06, "loss": 0.4762, "step": 7068 }, { "epoch": 0.81, "learning_rate": 1.8742966099201699e-06, "loss": 0.4658, "step": 7069 }, { "epoch": 0.81, "learning_rate": 1.8721396097367294e-06, "loss": 0.4481, "step": 7070 }, { "epoch": 0.81, "learning_rate": 1.8699837232516226e-06, "loss": 0.4427, "step": 7071 }, { "epoch": 0.81, "learning_rate": 1.867828950760262e-06, "loss": 0.4456, "step": 7072 }, { "epoch": 0.81, "learning_rate": 1.8656752925578948e-06, "loss": 0.4609, "step": 7073 }, { "epoch": 0.81, "learning_rate": 1.8635227489396178e-06, "loss": 0.4578, "step": 7074 }, { "epoch": 0.81, "learning_rate": 1.8613713202003813e-06, "loss": 0.4515, "step": 7075 }, { "epoch": 0.81, "learning_rate": 1.8592210066349781e-06, "loss": 0.4513, "step": 7076 }, { "epoch": 0.81, "learning_rate": 1.8570718085380512e-06, "loss": 0.4564, "step": 7077 }, { "epoch": 0.81, "learning_rate": 1.8549237262040876e-06, "loss": 0.4408, "step": 7078 }, { "epoch": 0.81, "learning_rate": 1.8527767599274193e-06, "loss": 0.4488, "step": 7079 }, { "epoch": 0.81, "learning_rate": 1.8506309100022334e-06, "loss": 0.4426, "step": 7080 }, { "epoch": 0.81, "learning_rate": 1.8484861767225549e-06, "loss": 0.4452, "step": 7081 }, { "epoch": 0.81, "learning_rate": 1.846342560382265e-06, "loss": 0.4534, "step": 7082 }, { "epoch": 0.81, "learning_rate": 1.8442000612750832e-06, "loss": 0.4499, "step": 7083 }, { "epoch": 0.81, "learning_rate": 1.8420586796945793e-06, "loss": 0.4449, "step": 7084 }, { "epoch": 0.81, "learning_rate": 1.839918415934171e-06, "loss": 0.4541, "step": 7085 }, { "epoch": 0.81, "learning_rate": 1.8377792702871266e-06, "loss": 0.4681, "step": 7086 }, { "epoch": 0.81, "learning_rate": 1.8356412430465498e-06, "loss": 0.4346, "step": 7087 }, { "epoch": 0.81, "learning_rate": 1.8335043345054048e-06, "loss": 0.4719, "step": 7088 }, { "epoch": 0.81, "learning_rate": 1.83136854495649e-06, "loss": 0.4324, "step": 7089 }, { "epoch": 0.81, "learning_rate": 1.829233874692461e-06, "loss": 0.4662, "step": 7090 }, { "epoch": 0.81, "learning_rate": 1.8271003240058127e-06, "loss": 0.4618, "step": 7091 }, { "epoch": 0.81, "learning_rate": 1.8249678931888881e-06, "loss": 0.4364, "step": 7092 }, { "epoch": 0.81, "learning_rate": 1.8228365825338811e-06, "loss": 0.4453, "step": 7093 }, { "epoch": 0.81, "learning_rate": 1.820706392332824e-06, "loss": 0.4628, "step": 7094 }, { "epoch": 0.81, "learning_rate": 1.8185773228776038e-06, "loss": 0.4462, "step": 7095 }, { "epoch": 0.81, "learning_rate": 1.8164493744599531e-06, "loss": 0.4569, "step": 7096 }, { "epoch": 0.81, "learning_rate": 1.814322547371443e-06, "loss": 0.4359, "step": 7097 }, { "epoch": 0.81, "learning_rate": 1.8121968419035007e-06, "loss": 0.4567, "step": 7098 }, { "epoch": 0.81, "learning_rate": 1.810072258347394e-06, "loss": 0.4508, "step": 7099 }, { "epoch": 0.81, "learning_rate": 1.8079487969942344e-06, "loss": 0.4589, "step": 7100 }, { "epoch": 0.81, "learning_rate": 1.8058264581349893e-06, "loss": 0.463, "step": 7101 }, { "epoch": 0.81, "learning_rate": 1.8037052420604618e-06, "loss": 0.4545, "step": 7102 }, { "epoch": 0.81, "learning_rate": 1.8015851490613079e-06, "loss": 0.4578, "step": 7103 }, { "epoch": 0.81, "learning_rate": 1.799466179428031e-06, "loss": 0.4468, "step": 7104 }, { "epoch": 0.81, "learning_rate": 1.7973483334509701e-06, "loss": 0.4457, "step": 7105 }, { "epoch": 0.81, "learning_rate": 1.795231611420325e-06, "loss": 0.4449, "step": 7106 }, { "epoch": 0.81, "learning_rate": 1.7931160136261272e-06, "loss": 0.4342, "step": 7107 }, { "epoch": 0.81, "learning_rate": 1.7910015403582659e-06, "loss": 0.4544, "step": 7108 }, { "epoch": 0.81, "learning_rate": 1.7888881919064694e-06, "loss": 0.4629, "step": 7109 }, { "epoch": 0.81, "learning_rate": 1.7867759685603115e-06, "loss": 0.4911, "step": 7110 }, { "epoch": 0.81, "learning_rate": 1.7846648706092173e-06, "loss": 0.444, "step": 7111 }, { "epoch": 0.81, "learning_rate": 1.78255489834245e-06, "loss": 0.4455, "step": 7112 }, { "epoch": 0.81, "learning_rate": 1.7804460520491263e-06, "loss": 0.4514, "step": 7113 }, { "epoch": 0.81, "learning_rate": 1.7783383320182069e-06, "loss": 0.4652, "step": 7114 }, { "epoch": 0.81, "learning_rate": 1.776231738538492e-06, "loss": 0.4435, "step": 7115 }, { "epoch": 0.81, "learning_rate": 1.7741262718986363e-06, "loss": 0.4645, "step": 7116 }, { "epoch": 0.81, "learning_rate": 1.7720219323871346e-06, "loss": 0.4633, "step": 7117 }, { "epoch": 0.81, "learning_rate": 1.7699187202923241e-06, "loss": 0.437, "step": 7118 }, { "epoch": 0.81, "learning_rate": 1.7678166359023973e-06, "loss": 0.4594, "step": 7119 }, { "epoch": 0.81, "learning_rate": 1.7657156795053821e-06, "loss": 0.4571, "step": 7120 }, { "epoch": 0.81, "learning_rate": 1.763615851389161e-06, "loss": 0.4344, "step": 7121 }, { "epoch": 0.81, "learning_rate": 1.7615171518414542e-06, "loss": 0.4568, "step": 7122 }, { "epoch": 0.81, "learning_rate": 1.7594195811498294e-06, "loss": 0.4552, "step": 7123 }, { "epoch": 0.81, "learning_rate": 1.7573231396017064e-06, "loss": 0.4622, "step": 7124 }, { "epoch": 0.81, "learning_rate": 1.755227827484338e-06, "loss": 0.4444, "step": 7125 }, { "epoch": 0.81, "learning_rate": 1.7531336450848335e-06, "loss": 0.4418, "step": 7126 }, { "epoch": 0.81, "learning_rate": 1.7510405926901408e-06, "loss": 0.4377, "step": 7127 }, { "epoch": 0.81, "learning_rate": 1.7489486705870517e-06, "loss": 0.448, "step": 7128 }, { "epoch": 0.81, "learning_rate": 1.7468578790622126e-06, "loss": 0.4435, "step": 7129 }, { "epoch": 0.81, "learning_rate": 1.7447682184021042e-06, "loss": 0.4557, "step": 7130 }, { "epoch": 0.81, "learning_rate": 1.7426796888930553e-06, "loss": 0.4505, "step": 7131 }, { "epoch": 0.82, "learning_rate": 1.7405922908212436e-06, "loss": 0.4546, "step": 7132 }, { "epoch": 0.82, "learning_rate": 1.7385060244726882e-06, "loss": 0.44, "step": 7133 }, { "epoch": 0.82, "learning_rate": 1.736420890133258e-06, "loss": 0.4504, "step": 7134 }, { "epoch": 0.82, "learning_rate": 1.7343368880886603e-06, "loss": 0.4574, "step": 7135 }, { "epoch": 0.82, "learning_rate": 1.7322540186244462e-06, "loss": 0.4503, "step": 7136 }, { "epoch": 0.82, "learning_rate": 1.7301722820260226e-06, "loss": 0.4587, "step": 7137 }, { "epoch": 0.82, "learning_rate": 1.7280916785786261e-06, "loss": 0.4356, "step": 7138 }, { "epoch": 0.82, "learning_rate": 1.7260122085673525e-06, "loss": 0.4409, "step": 7139 }, { "epoch": 0.82, "learning_rate": 1.7239338722771326e-06, "loss": 0.4578, "step": 7140 }, { "epoch": 0.82, "learning_rate": 1.721856669992743e-06, "loss": 0.447, "step": 7141 }, { "epoch": 0.82, "learning_rate": 1.7197806019988084e-06, "loss": 0.4626, "step": 7142 }, { "epoch": 0.82, "learning_rate": 1.7177056685797988e-06, "loss": 0.4323, "step": 7143 }, { "epoch": 0.82, "learning_rate": 1.7156318700200236e-06, "loss": 0.4271, "step": 7144 }, { "epoch": 0.82, "learning_rate": 1.713559206603642e-06, "loss": 0.4705, "step": 7145 }, { "epoch": 0.82, "learning_rate": 1.7114876786146505e-06, "loss": 0.4579, "step": 7146 }, { "epoch": 0.82, "learning_rate": 1.7094172863369007e-06, "loss": 0.4371, "step": 7147 }, { "epoch": 0.82, "learning_rate": 1.7073480300540802e-06, "loss": 0.4559, "step": 7148 }, { "epoch": 0.82, "learning_rate": 1.7052799100497197e-06, "loss": 0.4504, "step": 7149 }, { "epoch": 0.82, "learning_rate": 1.703212926607204e-06, "loss": 0.4783, "step": 7150 }, { "epoch": 0.82, "learning_rate": 1.7011470800097496e-06, "loss": 0.4489, "step": 7151 }, { "epoch": 0.82, "learning_rate": 1.6990823705404269e-06, "loss": 0.4556, "step": 7152 }, { "epoch": 0.82, "learning_rate": 1.6970187984821496e-06, "loss": 0.4528, "step": 7153 }, { "epoch": 0.82, "learning_rate": 1.694956364117668e-06, "loss": 0.4559, "step": 7154 }, { "epoch": 0.82, "learning_rate": 1.6928950677295875e-06, "loss": 0.4405, "step": 7155 }, { "epoch": 0.82, "learning_rate": 1.6908349096003484e-06, "loss": 0.4654, "step": 7156 }, { "epoch": 0.82, "learning_rate": 1.6887758900122352e-06, "loss": 0.453, "step": 7157 }, { "epoch": 0.82, "learning_rate": 1.6867180092473866e-06, "loss": 0.495, "step": 7158 }, { "epoch": 0.82, "learning_rate": 1.6846612675877716e-06, "loss": 0.4487, "step": 7159 }, { "epoch": 0.82, "learning_rate": 1.6826056653152122e-06, "loss": 0.46, "step": 7160 }, { "epoch": 0.82, "learning_rate": 1.6805512027113745e-06, "loss": 0.4511, "step": 7161 }, { "epoch": 0.82, "learning_rate": 1.6784978800577611e-06, "loss": 0.4701, "step": 7162 }, { "epoch": 0.82, "learning_rate": 1.6764456976357279e-06, "loss": 0.4382, "step": 7163 }, { "epoch": 0.82, "learning_rate": 1.6743946557264656e-06, "loss": 0.4417, "step": 7164 }, { "epoch": 0.82, "learning_rate": 1.672344754611016e-06, "loss": 0.4622, "step": 7165 }, { "epoch": 0.82, "learning_rate": 1.67029599457026e-06, "loss": 0.4403, "step": 7166 }, { "epoch": 0.82, "learning_rate": 1.6682483758849199e-06, "loss": 0.4704, "step": 7167 }, { "epoch": 0.82, "learning_rate": 1.666201898835572e-06, "loss": 0.4515, "step": 7168 }, { "epoch": 0.82, "learning_rate": 1.6641565637026225e-06, "loss": 0.4407, "step": 7169 }, { "epoch": 0.82, "learning_rate": 1.6621123707663312e-06, "loss": 0.448, "step": 7170 }, { "epoch": 0.82, "learning_rate": 1.6600693203068007e-06, "loss": 0.4588, "step": 7171 }, { "epoch": 0.82, "learning_rate": 1.6580274126039698e-06, "loss": 0.4502, "step": 7172 }, { "epoch": 0.82, "learning_rate": 1.6559866479376297e-06, "loss": 0.4401, "step": 7173 }, { "epoch": 0.82, "learning_rate": 1.6539470265874092e-06, "loss": 0.4351, "step": 7174 }, { "epoch": 0.82, "learning_rate": 1.651908548832779e-06, "loss": 0.4603, "step": 7175 }, { "epoch": 0.82, "learning_rate": 1.6498712149530606e-06, "loss": 0.4821, "step": 7176 }, { "epoch": 0.82, "learning_rate": 1.64783502522741e-06, "loss": 0.4347, "step": 7177 }, { "epoch": 0.82, "learning_rate": 1.6457999799348345e-06, "loss": 0.4536, "step": 7178 }, { "epoch": 0.82, "learning_rate": 1.6437660793541776e-06, "loss": 0.4413, "step": 7179 }, { "epoch": 0.82, "learning_rate": 1.6417333237641298e-06, "loss": 0.446, "step": 7180 }, { "epoch": 0.82, "learning_rate": 1.6397017134432281e-06, "loss": 0.455, "step": 7181 }, { "epoch": 0.82, "learning_rate": 1.6376712486698443e-06, "loss": 0.4394, "step": 7182 }, { "epoch": 0.82, "learning_rate": 1.635641929722196e-06, "loss": 0.4533, "step": 7183 }, { "epoch": 0.82, "learning_rate": 1.6336137568783495e-06, "loss": 0.4685, "step": 7184 }, { "epoch": 0.82, "learning_rate": 1.6315867304162058e-06, "loss": 0.4504, "step": 7185 }, { "epoch": 0.82, "learning_rate": 1.6295608506135162e-06, "loss": 0.4686, "step": 7186 }, { "epoch": 0.82, "learning_rate": 1.627536117747871e-06, "loss": 0.4506, "step": 7187 }, { "epoch": 0.82, "learning_rate": 1.625512532096699e-06, "loss": 0.4543, "step": 7188 }, { "epoch": 0.82, "learning_rate": 1.623490093937281e-06, "loss": 0.4635, "step": 7189 }, { "epoch": 0.82, "learning_rate": 1.6214688035467363e-06, "loss": 0.4493, "step": 7190 }, { "epoch": 0.82, "learning_rate": 1.6194486612020277e-06, "loss": 0.4523, "step": 7191 }, { "epoch": 0.82, "learning_rate": 1.6174296671799571e-06, "loss": 0.4677, "step": 7192 }, { "epoch": 0.82, "learning_rate": 1.6154118217571723e-06, "loss": 0.4354, "step": 7193 }, { "epoch": 0.82, "learning_rate": 1.6133951252101642e-06, "loss": 0.4581, "step": 7194 }, { "epoch": 0.82, "learning_rate": 1.6113795778152663e-06, "loss": 0.4396, "step": 7195 }, { "epoch": 0.82, "learning_rate": 1.6093651798486487e-06, "loss": 0.4427, "step": 7196 }, { "epoch": 0.82, "learning_rate": 1.6073519315863351e-06, "loss": 0.4417, "step": 7197 }, { "epoch": 0.82, "learning_rate": 1.6053398333041791e-06, "loss": 0.4423, "step": 7198 }, { "epoch": 0.82, "learning_rate": 1.6033288852778882e-06, "loss": 0.4448, "step": 7199 }, { "epoch": 0.82, "learning_rate": 1.6013190877830065e-06, "loss": 0.4561, "step": 7200 }, { "epoch": 0.82, "learning_rate": 1.5993104410949189e-06, "loss": 0.4564, "step": 7201 }, { "epoch": 0.82, "learning_rate": 1.5973029454888578e-06, "loss": 0.4518, "step": 7202 }, { "epoch": 0.82, "learning_rate": 1.5952966012398908e-06, "loss": 0.4463, "step": 7203 }, { "epoch": 0.82, "learning_rate": 1.5932914086229366e-06, "loss": 0.4785, "step": 7204 }, { "epoch": 0.82, "learning_rate": 1.5912873679127495e-06, "loss": 0.4446, "step": 7205 }, { "epoch": 0.82, "learning_rate": 1.5892844793839235e-06, "loss": 0.4422, "step": 7206 }, { "epoch": 0.82, "learning_rate": 1.5872827433109073e-06, "loss": 0.4585, "step": 7207 }, { "epoch": 0.82, "learning_rate": 1.5852821599679747e-06, "loss": 0.4655, "step": 7208 }, { "epoch": 0.82, "learning_rate": 1.5832827296292564e-06, "loss": 0.4546, "step": 7209 }, { "epoch": 0.82, "learning_rate": 1.5812844525687188e-06, "loss": 0.4432, "step": 7210 }, { "epoch": 0.82, "learning_rate": 1.5792873290601662e-06, "loss": 0.4541, "step": 7211 }, { "epoch": 0.82, "learning_rate": 1.5772913593772543e-06, "loss": 0.4737, "step": 7212 }, { "epoch": 0.82, "learning_rate": 1.575296543793473e-06, "loss": 0.4297, "step": 7213 }, { "epoch": 0.82, "learning_rate": 1.573302882582154e-06, "loss": 0.4452, "step": 7214 }, { "epoch": 0.82, "learning_rate": 1.5713103760164782e-06, "loss": 0.4724, "step": 7215 }, { "epoch": 0.82, "learning_rate": 1.56931902436946e-06, "loss": 0.4592, "step": 7216 }, { "epoch": 0.82, "learning_rate": 1.5673288279139586e-06, "loss": 0.4475, "step": 7217 }, { "epoch": 0.82, "learning_rate": 1.5653397869226806e-06, "loss": 0.4772, "step": 7218 }, { "epoch": 0.83, "learning_rate": 1.5633519016681631e-06, "loss": 0.4337, "step": 7219 }, { "epoch": 0.83, "learning_rate": 1.561365172422795e-06, "loss": 0.4538, "step": 7220 }, { "epoch": 0.83, "learning_rate": 1.559379599458798e-06, "loss": 0.4443, "step": 7221 }, { "epoch": 0.83, "learning_rate": 1.5573951830482458e-06, "loss": 0.4493, "step": 7222 }, { "epoch": 0.83, "learning_rate": 1.5554119234630438e-06, "loss": 0.4358, "step": 7223 }, { "epoch": 0.83, "learning_rate": 1.553429820974941e-06, "loss": 0.4569, "step": 7224 }, { "epoch": 0.83, "learning_rate": 1.5514488758555357e-06, "loss": 0.4639, "step": 7225 }, { "epoch": 0.83, "learning_rate": 1.5494690883762553e-06, "loss": 0.4464, "step": 7226 }, { "epoch": 0.83, "learning_rate": 1.5474904588083772e-06, "loss": 0.4525, "step": 7227 }, { "epoch": 0.83, "learning_rate": 1.5455129874230212e-06, "loss": 0.4562, "step": 7228 }, { "epoch": 0.83, "learning_rate": 1.5435366744911406e-06, "loss": 0.4502, "step": 7229 }, { "epoch": 0.83, "learning_rate": 1.5415615202835377e-06, "loss": 0.4496, "step": 7230 }, { "epoch": 0.83, "learning_rate": 1.5395875250708513e-06, "loss": 0.4492, "step": 7231 }, { "epoch": 0.83, "learning_rate": 1.53761468912356e-06, "loss": 0.4481, "step": 7232 }, { "epoch": 0.83, "learning_rate": 1.5356430127119915e-06, "loss": 0.4517, "step": 7233 }, { "epoch": 0.83, "learning_rate": 1.5336724961063043e-06, "loss": 0.4612, "step": 7234 }, { "epoch": 0.83, "learning_rate": 1.5317031395765081e-06, "loss": 0.447, "step": 7235 }, { "epoch": 0.83, "learning_rate": 1.5297349433924435e-06, "loss": 0.4387, "step": 7236 }, { "epoch": 0.83, "learning_rate": 1.5277679078238018e-06, "loss": 0.4682, "step": 7237 }, { "epoch": 0.83, "learning_rate": 1.5258020331401102e-06, "loss": 0.4466, "step": 7238 }, { "epoch": 0.83, "learning_rate": 1.523837319610737e-06, "loss": 0.4367, "step": 7239 }, { "epoch": 0.83, "learning_rate": 1.5218737675048888e-06, "loss": 0.452, "step": 7240 }, { "epoch": 0.83, "learning_rate": 1.5199113770916207e-06, "loss": 0.4353, "step": 7241 }, { "epoch": 0.83, "learning_rate": 1.5179501486398196e-06, "loss": 0.4702, "step": 7242 }, { "epoch": 0.83, "learning_rate": 1.5159900824182227e-06, "loss": 0.4602, "step": 7243 }, { "epoch": 0.83, "learning_rate": 1.5140311786953986e-06, "loss": 0.4643, "step": 7244 }, { "epoch": 0.83, "learning_rate": 1.5120734377397617e-06, "loss": 0.4605, "step": 7245 }, { "epoch": 0.83, "learning_rate": 1.5101168598195647e-06, "loss": 0.4429, "step": 7246 }, { "epoch": 0.83, "learning_rate": 1.508161445202906e-06, "loss": 0.4756, "step": 7247 }, { "epoch": 0.83, "learning_rate": 1.5062071941577217e-06, "loss": 0.4581, "step": 7248 }, { "epoch": 0.83, "learning_rate": 1.5042541069517846e-06, "loss": 0.4531, "step": 7249 }, { "epoch": 0.83, "learning_rate": 1.5023021838527108e-06, "loss": 0.4378, "step": 7250 }, { "epoch": 0.83, "learning_rate": 1.5003514251279616e-06, "loss": 0.4601, "step": 7251 }, { "epoch": 0.83, "learning_rate": 1.4984018310448312e-06, "loss": 0.466, "step": 7252 }, { "epoch": 0.83, "learning_rate": 1.4964534018704558e-06, "loss": 0.4375, "step": 7253 }, { "epoch": 0.83, "learning_rate": 1.4945061378718184e-06, "loss": 0.459, "step": 7254 }, { "epoch": 0.83, "learning_rate": 1.4925600393157325e-06, "loss": 0.4477, "step": 7255 }, { "epoch": 0.83, "learning_rate": 1.4906151064688602e-06, "loss": 0.4788, "step": 7256 }, { "epoch": 0.83, "learning_rate": 1.4886713395977015e-06, "loss": 0.4355, "step": 7257 }, { "epoch": 0.83, "learning_rate": 1.4867287389685936e-06, "loss": 0.4485, "step": 7258 }, { "epoch": 0.83, "learning_rate": 1.4847873048477191e-06, "loss": 0.4611, "step": 7259 }, { "epoch": 0.83, "learning_rate": 1.482847037501094e-06, "loss": 0.4529, "step": 7260 }, { "epoch": 0.83, "learning_rate": 1.4809079371945823e-06, "loss": 0.4453, "step": 7261 }, { "epoch": 0.83, "learning_rate": 1.4789700041938816e-06, "loss": 0.4605, "step": 7262 }, { "epoch": 0.83, "learning_rate": 1.4770332387645293e-06, "loss": 0.4372, "step": 7263 }, { "epoch": 0.83, "learning_rate": 1.475097641171912e-06, "loss": 0.4592, "step": 7264 }, { "epoch": 0.83, "learning_rate": 1.4731632116812434e-06, "loss": 0.4514, "step": 7265 }, { "epoch": 0.83, "learning_rate": 1.4712299505575868e-06, "loss": 0.4276, "step": 7266 }, { "epoch": 0.83, "learning_rate": 1.4692978580658434e-06, "loss": 0.4622, "step": 7267 }, { "epoch": 0.83, "learning_rate": 1.4673669344707498e-06, "loss": 0.4572, "step": 7268 }, { "epoch": 0.83, "learning_rate": 1.4654371800368882e-06, "loss": 0.4503, "step": 7269 }, { "epoch": 0.83, "learning_rate": 1.4635085950286776e-06, "loss": 0.4591, "step": 7270 }, { "epoch": 0.83, "learning_rate": 1.4615811797103751e-06, "loss": 0.4537, "step": 7271 }, { "epoch": 0.83, "learning_rate": 1.459654934346083e-06, "loss": 0.4507, "step": 7272 }, { "epoch": 0.83, "learning_rate": 1.4577298591997357e-06, "loss": 0.4602, "step": 7273 }, { "epoch": 0.83, "learning_rate": 1.4558059545351144e-06, "loss": 0.4625, "step": 7274 }, { "epoch": 0.83, "learning_rate": 1.4538832206158381e-06, "loss": 0.4445, "step": 7275 }, { "epoch": 0.83, "learning_rate": 1.4519616577053597e-06, "loss": 0.4464, "step": 7276 }, { "epoch": 0.83, "learning_rate": 1.4500412660669828e-06, "loss": 0.4605, "step": 7277 }, { "epoch": 0.83, "learning_rate": 1.448122045963839e-06, "loss": 0.4558, "step": 7278 }, { "epoch": 0.83, "learning_rate": 1.4462039976589048e-06, "loss": 0.4509, "step": 7279 }, { "epoch": 0.83, "learning_rate": 1.444287121414998e-06, "loss": 0.4439, "step": 7280 }, { "epoch": 0.83, "learning_rate": 1.442371417494769e-06, "loss": 0.4491, "step": 7281 }, { "epoch": 0.83, "learning_rate": 1.4404568861607172e-06, "loss": 0.4543, "step": 7282 }, { "epoch": 0.83, "learning_rate": 1.4385435276751724e-06, "loss": 0.4388, "step": 7283 }, { "epoch": 0.83, "learning_rate": 1.4366313423003087e-06, "loss": 0.4459, "step": 7284 }, { "epoch": 0.83, "learning_rate": 1.4347203302981393e-06, "loss": 0.4641, "step": 7285 }, { "epoch": 0.83, "learning_rate": 1.432810491930514e-06, "loss": 0.4506, "step": 7286 }, { "epoch": 0.83, "learning_rate": 1.4309018274591246e-06, "loss": 0.4384, "step": 7287 }, { "epoch": 0.83, "learning_rate": 1.4289943371455007e-06, "loss": 0.4767, "step": 7288 }, { "epoch": 0.83, "learning_rate": 1.4270880212510086e-06, "loss": 0.4374, "step": 7289 }, { "epoch": 0.83, "learning_rate": 1.4251828800368594e-06, "loss": 0.4517, "step": 7290 }, { "epoch": 0.83, "learning_rate": 1.4232789137640968e-06, "loss": 0.4359, "step": 7291 }, { "epoch": 0.83, "learning_rate": 1.4213761226936095e-06, "loss": 0.4627, "step": 7292 }, { "epoch": 0.83, "learning_rate": 1.4194745070861194e-06, "loss": 0.4673, "step": 7293 }, { "epoch": 0.83, "learning_rate": 1.417574067202192e-06, "loss": 0.4501, "step": 7294 }, { "epoch": 0.83, "learning_rate": 1.4156748033022328e-06, "loss": 0.443, "step": 7295 }, { "epoch": 0.83, "learning_rate": 1.413776715646481e-06, "loss": 0.4604, "step": 7296 }, { "epoch": 0.83, "learning_rate": 1.4118798044950132e-06, "loss": 0.4462, "step": 7297 }, { "epoch": 0.83, "learning_rate": 1.409984070107755e-06, "loss": 0.4305, "step": 7298 }, { "epoch": 0.83, "learning_rate": 1.4080895127444594e-06, "loss": 0.4609, "step": 7299 }, { "epoch": 0.83, "learning_rate": 1.4061961326647266e-06, "loss": 0.4414, "step": 7300 }, { "epoch": 0.83, "learning_rate": 1.4043039301279904e-06, "loss": 0.476, "step": 7301 }, { "epoch": 0.83, "learning_rate": 1.402412905393523e-06, "loss": 0.4646, "step": 7302 }, { "epoch": 0.83, "learning_rate": 1.4005230587204388e-06, "loss": 0.4492, "step": 7303 }, { "epoch": 0.83, "learning_rate": 1.398634390367688e-06, "loss": 0.4339, "step": 7304 }, { "epoch": 0.83, "learning_rate": 1.3967469005940638e-06, "loss": 0.448, "step": 7305 }, { "epoch": 0.83, "learning_rate": 1.3948605896581923e-06, "loss": 0.4402, "step": 7306 }, { "epoch": 0.84, "learning_rate": 1.3929754578185373e-06, "loss": 0.4364, "step": 7307 }, { "epoch": 0.84, "learning_rate": 1.3910915053334094e-06, "loss": 0.463, "step": 7308 }, { "epoch": 0.84, "learning_rate": 1.3892087324609482e-06, "loss": 0.4454, "step": 7309 }, { "epoch": 0.84, "learning_rate": 1.3873271394591348e-06, "loss": 0.4623, "step": 7310 }, { "epoch": 0.84, "learning_rate": 1.385446726585794e-06, "loss": 0.4608, "step": 7311 }, { "epoch": 0.84, "learning_rate": 1.3835674940985788e-06, "loss": 0.4374, "step": 7312 }, { "epoch": 0.84, "learning_rate": 1.3816894422549888e-06, "loss": 0.4594, "step": 7313 }, { "epoch": 0.84, "learning_rate": 1.379812571312361e-06, "loss": 0.4467, "step": 7314 }, { "epoch": 0.84, "learning_rate": 1.3779368815278648e-06, "loss": 0.4594, "step": 7315 }, { "epoch": 0.84, "learning_rate": 1.3760623731585165e-06, "loss": 0.4557, "step": 7316 }, { "epoch": 0.84, "learning_rate": 1.3741890464611597e-06, "loss": 0.446, "step": 7317 }, { "epoch": 0.84, "learning_rate": 1.3723169016924865e-06, "loss": 0.4579, "step": 7318 }, { "epoch": 0.84, "learning_rate": 1.370445939109022e-06, "loss": 0.4598, "step": 7319 }, { "epoch": 0.84, "learning_rate": 1.3685761589671253e-06, "loss": 0.4376, "step": 7320 }, { "epoch": 0.84, "learning_rate": 1.366707561523004e-06, "loss": 0.4252, "step": 7321 }, { "epoch": 0.84, "learning_rate": 1.3648401470326932e-06, "loss": 0.4451, "step": 7322 }, { "epoch": 0.84, "learning_rate": 1.3629739157520728e-06, "loss": 0.4647, "step": 7323 }, { "epoch": 0.84, "learning_rate": 1.361108867936859e-06, "loss": 0.4317, "step": 7324 }, { "epoch": 0.84, "learning_rate": 1.359245003842602e-06, "loss": 0.4451, "step": 7325 }, { "epoch": 0.84, "learning_rate": 1.3573823237246965e-06, "loss": 0.465, "step": 7326 }, { "epoch": 0.84, "learning_rate": 1.3555208278383691e-06, "loss": 0.4469, "step": 7327 }, { "epoch": 0.84, "learning_rate": 1.353660516438684e-06, "loss": 0.4517, "step": 7328 }, { "epoch": 0.84, "learning_rate": 1.3518013897805504e-06, "loss": 0.4704, "step": 7329 }, { "epoch": 0.84, "learning_rate": 1.3499434481187045e-06, "loss": 0.4471, "step": 7330 }, { "epoch": 0.84, "learning_rate": 1.3480866917077294e-06, "loss": 0.4489, "step": 7331 }, { "epoch": 0.84, "learning_rate": 1.346231120802044e-06, "loss": 0.4499, "step": 7332 }, { "epoch": 0.84, "learning_rate": 1.3443767356558989e-06, "loss": 0.4474, "step": 7333 }, { "epoch": 0.84, "learning_rate": 1.3425235365233892e-06, "loss": 0.4623, "step": 7334 }, { "epoch": 0.84, "learning_rate": 1.3406715236584433e-06, "loss": 0.4493, "step": 7335 }, { "epoch": 0.84, "learning_rate": 1.3388206973148265e-06, "loss": 0.4323, "step": 7336 }, { "epoch": 0.84, "learning_rate": 1.336971057746147e-06, "loss": 0.4577, "step": 7337 }, { "epoch": 0.84, "learning_rate": 1.335122605205843e-06, "loss": 0.436, "step": 7338 }, { "epoch": 0.84, "learning_rate": 1.3332753399471976e-06, "loss": 0.4512, "step": 7339 }, { "epoch": 0.84, "learning_rate": 1.3314292622233227e-06, "loss": 0.4495, "step": 7340 }, { "epoch": 0.84, "learning_rate": 1.329584372287176e-06, "loss": 0.4417, "step": 7341 }, { "epoch": 0.84, "learning_rate": 1.3277406703915485e-06, "loss": 0.4506, "step": 7342 }, { "epoch": 0.84, "learning_rate": 1.325898156789066e-06, "loss": 0.4717, "step": 7343 }, { "epoch": 0.84, "learning_rate": 1.3240568317321966e-06, "loss": 0.4456, "step": 7344 }, { "epoch": 0.84, "learning_rate": 1.322216695473243e-06, "loss": 0.4531, "step": 7345 }, { "epoch": 0.84, "learning_rate": 1.320377748264341e-06, "loss": 0.4392, "step": 7346 }, { "epoch": 0.84, "learning_rate": 1.3185399903574724e-06, "loss": 0.4464, "step": 7347 }, { "epoch": 0.84, "learning_rate": 1.3167034220044494e-06, "loss": 0.4205, "step": 7348 }, { "epoch": 0.84, "learning_rate": 1.3148680434569206e-06, "loss": 0.4495, "step": 7349 }, { "epoch": 0.84, "learning_rate": 1.3130338549663745e-06, "loss": 0.4453, "step": 7350 }, { "epoch": 0.84, "learning_rate": 1.3112008567841371e-06, "loss": 0.4435, "step": 7351 }, { "epoch": 0.84, "learning_rate": 1.309369049161372e-06, "loss": 0.4557, "step": 7352 }, { "epoch": 0.84, "learning_rate": 1.3075384323490759e-06, "loss": 0.4497, "step": 7353 }, { "epoch": 0.84, "learning_rate": 1.3057090065980816e-06, "loss": 0.4427, "step": 7354 }, { "epoch": 0.84, "learning_rate": 1.3038807721590663e-06, "loss": 0.4577, "step": 7355 }, { "epoch": 0.84, "learning_rate": 1.302053729282533e-06, "loss": 0.4432, "step": 7356 }, { "epoch": 0.84, "learning_rate": 1.3002278782188337e-06, "loss": 0.4521, "step": 7357 }, { "epoch": 0.84, "learning_rate": 1.2984032192181473e-06, "loss": 0.4507, "step": 7358 }, { "epoch": 0.84, "learning_rate": 1.2965797525304913e-06, "loss": 0.447, "step": 7359 }, { "epoch": 0.84, "learning_rate": 1.2947574784057237e-06, "loss": 0.4633, "step": 7360 }, { "epoch": 0.84, "learning_rate": 1.2929363970935371e-06, "loss": 0.4423, "step": 7361 }, { "epoch": 0.84, "learning_rate": 1.2911165088434584e-06, "loss": 0.4446, "step": 7362 }, { "epoch": 0.84, "learning_rate": 1.2892978139048562e-06, "loss": 0.459, "step": 7363 }, { "epoch": 0.84, "learning_rate": 1.2874803125269274e-06, "loss": 0.4648, "step": 7364 }, { "epoch": 0.84, "learning_rate": 1.2856640049587154e-06, "loss": 0.4511, "step": 7365 }, { "epoch": 0.84, "learning_rate": 1.283848891449092e-06, "loss": 0.4607, "step": 7366 }, { "epoch": 0.84, "learning_rate": 1.2820349722467663e-06, "loss": 0.4432, "step": 7367 }, { "epoch": 0.84, "learning_rate": 1.2802222476002911e-06, "loss": 0.4673, "step": 7368 }, { "epoch": 0.84, "learning_rate": 1.278410717758045e-06, "loss": 0.449, "step": 7369 }, { "epoch": 0.84, "learning_rate": 1.2766003829682504e-06, "loss": 0.4386, "step": 7370 }, { "epoch": 0.84, "learning_rate": 1.2747912434789655e-06, "loss": 0.4515, "step": 7371 }, { "epoch": 0.84, "learning_rate": 1.2729832995380775e-06, "loss": 0.4452, "step": 7372 }, { "epoch": 0.84, "learning_rate": 1.2711765513933216e-06, "loss": 0.4626, "step": 7373 }, { "epoch": 0.84, "learning_rate": 1.2693709992922575e-06, "loss": 0.4452, "step": 7374 }, { "epoch": 0.84, "learning_rate": 1.2675666434822887e-06, "loss": 0.443, "step": 7375 }, { "epoch": 0.84, "learning_rate": 1.2657634842106526e-06, "loss": 0.4632, "step": 7376 }, { "epoch": 0.84, "learning_rate": 1.2639615217244194e-06, "loss": 0.459, "step": 7377 }, { "epoch": 0.84, "learning_rate": 1.2621607562705018e-06, "loss": 0.4533, "step": 7378 }, { "epoch": 0.84, "learning_rate": 1.26036118809564e-06, "loss": 0.4352, "step": 7379 }, { "epoch": 0.84, "learning_rate": 1.2585628174464192e-06, "loss": 0.4407, "step": 7380 }, { "epoch": 0.84, "learning_rate": 1.2567656445692566e-06, "loss": 0.4571, "step": 7381 }, { "epoch": 0.84, "learning_rate": 1.254969669710402e-06, "loss": 0.4504, "step": 7382 }, { "epoch": 0.84, "learning_rate": 1.2531748931159472e-06, "loss": 0.4709, "step": 7383 }, { "epoch": 0.84, "learning_rate": 1.2513813150318155e-06, "loss": 0.4495, "step": 7384 }, { "epoch": 0.84, "learning_rate": 1.249588935703765e-06, "loss": 0.4497, "step": 7385 }, { "epoch": 0.84, "learning_rate": 1.2477977553773957e-06, "loss": 0.4771, "step": 7386 }, { "epoch": 0.84, "learning_rate": 1.2460077742981347e-06, "loss": 0.4575, "step": 7387 }, { "epoch": 0.84, "learning_rate": 1.2442189927112514e-06, "loss": 0.4703, "step": 7388 }, { "epoch": 0.84, "learning_rate": 1.2424314108618507e-06, "loss": 0.4338, "step": 7389 }, { "epoch": 0.84, "learning_rate": 1.240645028994869e-06, "loss": 0.44, "step": 7390 }, { "epoch": 0.84, "learning_rate": 1.2388598473550828e-06, "loss": 0.4633, "step": 7391 }, { "epoch": 0.84, "learning_rate": 1.2370758661870997e-06, "loss": 0.4367, "step": 7392 }, { "epoch": 0.84, "learning_rate": 1.235293085735364e-06, "loss": 0.4532, "step": 7393 }, { "epoch": 0.85, "learning_rate": 1.2335115062441593e-06, "loss": 0.4382, "step": 7394 }, { "epoch": 0.85, "learning_rate": 1.2317311279575982e-06, "loss": 0.4713, "step": 7395 }, { "epoch": 0.85, "learning_rate": 1.2299519511196368e-06, "loss": 0.4241, "step": 7396 }, { "epoch": 0.85, "learning_rate": 1.2281739759740575e-06, "loss": 0.4588, "step": 7397 }, { "epoch": 0.85, "learning_rate": 1.2263972027644854e-06, "loss": 0.4597, "step": 7398 }, { "epoch": 0.85, "learning_rate": 1.2246216317343796e-06, "loss": 0.4638, "step": 7399 }, { "epoch": 0.85, "learning_rate": 1.2228472631270272e-06, "loss": 0.4634, "step": 7400 }, { "epoch": 0.85, "learning_rate": 1.221074097185564e-06, "loss": 0.4513, "step": 7401 }, { "epoch": 0.85, "learning_rate": 1.2193021341529477e-06, "loss": 0.4579, "step": 7402 }, { "epoch": 0.85, "learning_rate": 1.2175313742719775e-06, "loss": 0.4613, "step": 7403 }, { "epoch": 0.85, "learning_rate": 1.2157618177852893e-06, "loss": 0.466, "step": 7404 }, { "epoch": 0.85, "learning_rate": 1.2139934649353503e-06, "loss": 0.4523, "step": 7405 }, { "epoch": 0.85, "learning_rate": 1.212226315964462e-06, "loss": 0.4477, "step": 7406 }, { "epoch": 0.85, "learning_rate": 1.2104603711147666e-06, "loss": 0.4393, "step": 7407 }, { "epoch": 0.85, "learning_rate": 1.2086956306282371e-06, "loss": 0.4522, "step": 7408 }, { "epoch": 0.85, "learning_rate": 1.2069320947466845e-06, "loss": 0.4699, "step": 7409 }, { "epoch": 0.85, "learning_rate": 1.20516976371175e-06, "loss": 0.4423, "step": 7410 }, { "epoch": 0.85, "learning_rate": 1.2034086377649102e-06, "loss": 0.4703, "step": 7411 }, { "epoch": 0.85, "learning_rate": 1.2016487171474844e-06, "loss": 0.4311, "step": 7412 }, { "epoch": 0.85, "learning_rate": 1.1998900021006155e-06, "loss": 0.4456, "step": 7413 }, { "epoch": 0.85, "learning_rate": 1.1981324928652905e-06, "loss": 0.4382, "step": 7414 }, { "epoch": 0.85, "learning_rate": 1.1963761896823255e-06, "loss": 0.4528, "step": 7415 }, { "epoch": 0.85, "learning_rate": 1.1946210927923729e-06, "loss": 0.4467, "step": 7416 }, { "epoch": 0.85, "learning_rate": 1.1928672024359211e-06, "loss": 0.448, "step": 7417 }, { "epoch": 0.85, "learning_rate": 1.1911145188532936e-06, "loss": 0.4427, "step": 7418 }, { "epoch": 0.85, "learning_rate": 1.1893630422846437e-06, "loss": 0.4495, "step": 7419 }, { "epoch": 0.85, "learning_rate": 1.187612772969966e-06, "loss": 0.4557, "step": 7420 }, { "epoch": 0.85, "learning_rate": 1.1858637111490845e-06, "loss": 0.4693, "step": 7421 }, { "epoch": 0.85, "learning_rate": 1.1841158570616617e-06, "loss": 0.453, "step": 7422 }, { "epoch": 0.85, "learning_rate": 1.1823692109471919e-06, "loss": 0.4517, "step": 7423 }, { "epoch": 0.85, "learning_rate": 1.1806237730450009e-06, "loss": 0.4596, "step": 7424 }, { "epoch": 0.85, "learning_rate": 1.1788795435942591e-06, "loss": 0.4496, "step": 7425 }, { "epoch": 0.85, "learning_rate": 1.1771365228339593e-06, "loss": 0.4406, "step": 7426 }, { "epoch": 0.85, "learning_rate": 1.1753947110029373e-06, "loss": 0.4555, "step": 7427 }, { "epoch": 0.85, "learning_rate": 1.17365410833986e-06, "loss": 0.4693, "step": 7428 }, { "epoch": 0.85, "learning_rate": 1.1719147150832278e-06, "loss": 0.4451, "step": 7429 }, { "epoch": 0.85, "learning_rate": 1.1701765314713786e-06, "loss": 0.4423, "step": 7430 }, { "epoch": 0.85, "learning_rate": 1.16843955774248e-06, "loss": 0.4563, "step": 7431 }, { "epoch": 0.85, "learning_rate": 1.1667037941345361e-06, "loss": 0.4354, "step": 7432 }, { "epoch": 0.85, "learning_rate": 1.1649692408853875e-06, "loss": 0.4411, "step": 7433 }, { "epoch": 0.85, "learning_rate": 1.163235898232703e-06, "loss": 0.4415, "step": 7434 }, { "epoch": 0.85, "learning_rate": 1.1615037664139928e-06, "loss": 0.4729, "step": 7435 }, { "epoch": 0.85, "learning_rate": 1.1597728456665958e-06, "loss": 0.4422, "step": 7436 }, { "epoch": 0.85, "learning_rate": 1.1580431362276866e-06, "loss": 0.47, "step": 7437 }, { "epoch": 0.85, "learning_rate": 1.156314638334277e-06, "loss": 0.4466, "step": 7438 }, { "epoch": 0.85, "learning_rate": 1.1545873522232055e-06, "loss": 0.4476, "step": 7439 }, { "epoch": 0.85, "learning_rate": 1.1528612781311532e-06, "loss": 0.4512, "step": 7440 }, { "epoch": 0.85, "learning_rate": 1.1511364162946282e-06, "loss": 0.4626, "step": 7441 }, { "epoch": 0.85, "learning_rate": 1.1494127669499732e-06, "loss": 0.4321, "step": 7442 }, { "epoch": 0.85, "learning_rate": 1.147690330333371e-06, "loss": 0.4471, "step": 7443 }, { "epoch": 0.85, "learning_rate": 1.14596910668083e-06, "loss": 0.463, "step": 7444 }, { "epoch": 0.85, "learning_rate": 1.1442490962281983e-06, "loss": 0.449, "step": 7445 }, { "epoch": 0.85, "learning_rate": 1.1425302992111564e-06, "loss": 0.4584, "step": 7446 }, { "epoch": 0.85, "learning_rate": 1.140812715865215e-06, "loss": 0.4398, "step": 7447 }, { "epoch": 0.85, "learning_rate": 1.1390963464257254e-06, "loss": 0.4492, "step": 7448 }, { "epoch": 0.85, "learning_rate": 1.1373811911278666e-06, "loss": 0.4535, "step": 7449 }, { "epoch": 0.85, "learning_rate": 1.1356672502066512e-06, "loss": 0.4298, "step": 7450 }, { "epoch": 0.85, "learning_rate": 1.1339545238969308e-06, "loss": 0.4531, "step": 7451 }, { "epoch": 0.85, "learning_rate": 1.1322430124333839e-06, "loss": 0.4477, "step": 7452 }, { "epoch": 0.85, "learning_rate": 1.1305327160505286e-06, "loss": 0.4755, "step": 7453 }, { "epoch": 0.85, "learning_rate": 1.1288236349827108e-06, "loss": 0.4572, "step": 7454 }, { "epoch": 0.85, "learning_rate": 1.1271157694641144e-06, "loss": 0.433, "step": 7455 }, { "epoch": 0.85, "learning_rate": 1.1254091197287564e-06, "loss": 0.4565, "step": 7456 }, { "epoch": 0.85, "learning_rate": 1.1237036860104833e-06, "loss": 0.4589, "step": 7457 }, { "epoch": 0.85, "learning_rate": 1.1219994685429814e-06, "loss": 0.4504, "step": 7458 }, { "epoch": 0.85, "learning_rate": 1.1202964675597627e-06, "loss": 0.4553, "step": 7459 }, { "epoch": 0.85, "learning_rate": 1.1185946832941774e-06, "loss": 0.4452, "step": 7460 }, { "epoch": 0.85, "learning_rate": 1.116894115979409e-06, "loss": 0.4826, "step": 7461 }, { "epoch": 0.85, "learning_rate": 1.115194765848473e-06, "loss": 0.4367, "step": 7462 }, { "epoch": 0.85, "learning_rate": 1.1134966331342157e-06, "loss": 0.4409, "step": 7463 }, { "epoch": 0.85, "learning_rate": 1.1117997180693207e-06, "loss": 0.474, "step": 7464 }, { "epoch": 0.85, "learning_rate": 1.1101040208863035e-06, "loss": 0.4283, "step": 7465 }, { "epoch": 0.85, "learning_rate": 1.1084095418175156e-06, "loss": 0.4431, "step": 7466 }, { "epoch": 0.85, "learning_rate": 1.106716281095136e-06, "loss": 0.4705, "step": 7467 }, { "epoch": 0.85, "learning_rate": 1.1050242389511757e-06, "loss": 0.4547, "step": 7468 }, { "epoch": 0.85, "learning_rate": 1.103333415617488e-06, "loss": 0.4496, "step": 7469 }, { "epoch": 0.85, "learning_rate": 1.1016438113257487e-06, "loss": 0.4439, "step": 7470 }, { "epoch": 0.85, "learning_rate": 1.0999554263074752e-06, "loss": 0.4491, "step": 7471 }, { "epoch": 0.85, "learning_rate": 1.0982682607940131e-06, "loss": 0.4593, "step": 7472 }, { "epoch": 0.85, "learning_rate": 1.0965823150165378e-06, "loss": 0.4651, "step": 7473 }, { "epoch": 0.85, "learning_rate": 1.0948975892060655e-06, "loss": 0.4513, "step": 7474 }, { "epoch": 0.85, "learning_rate": 1.0932140835934414e-06, "loss": 0.4345, "step": 7475 }, { "epoch": 0.85, "learning_rate": 1.091531798409341e-06, "loss": 0.4719, "step": 7476 }, { "epoch": 0.85, "learning_rate": 1.0898507338842779e-06, "loss": 0.4596, "step": 7477 }, { "epoch": 0.85, "learning_rate": 1.088170890248591e-06, "loss": 0.4358, "step": 7478 }, { "epoch": 0.85, "learning_rate": 1.086492267732462e-06, "loss": 0.452, "step": 7479 }, { "epoch": 0.85, "learning_rate": 1.0848148665658975e-06, "loss": 0.4601, "step": 7480 }, { "epoch": 0.85, "learning_rate": 1.0831386869787353e-06, "loss": 0.4573, "step": 7481 }, { "epoch": 0.86, "learning_rate": 1.0814637292006536e-06, "loss": 0.4399, "step": 7482 }, { "epoch": 0.86, "learning_rate": 1.0797899934611567e-06, "loss": 0.4623, "step": 7483 }, { "epoch": 0.86, "learning_rate": 1.0781174799895844e-06, "loss": 0.4499, "step": 7484 }, { "epoch": 0.86, "learning_rate": 1.0764461890151112e-06, "loss": 0.4421, "step": 7485 }, { "epoch": 0.86, "learning_rate": 1.0747761207667372e-06, "loss": 0.4446, "step": 7486 }, { "epoch": 0.86, "learning_rate": 1.0731072754733019e-06, "loss": 0.4585, "step": 7487 }, { "epoch": 0.86, "learning_rate": 1.071439653363473e-06, "loss": 0.4381, "step": 7488 }, { "epoch": 0.86, "learning_rate": 1.0697732546657512e-06, "loss": 0.4405, "step": 7489 }, { "epoch": 0.86, "learning_rate": 1.068108079608473e-06, "loss": 0.4639, "step": 7490 }, { "epoch": 0.86, "learning_rate": 1.0664441284198002e-06, "loss": 0.4362, "step": 7491 }, { "epoch": 0.86, "learning_rate": 1.0647814013277358e-06, "loss": 0.4415, "step": 7492 }, { "epoch": 0.86, "learning_rate": 1.0631198985601077e-06, "loss": 0.4541, "step": 7493 }, { "epoch": 0.86, "learning_rate": 1.0614596203445793e-06, "loss": 0.4463, "step": 7494 }, { "epoch": 0.86, "learning_rate": 1.0598005669086475e-06, "loss": 0.4557, "step": 7495 }, { "epoch": 0.86, "learning_rate": 1.0581427384796372e-06, "loss": 0.4597, "step": 7496 }, { "epoch": 0.86, "learning_rate": 1.056486135284711e-06, "loss": 0.4463, "step": 7497 }, { "epoch": 0.86, "learning_rate": 1.0548307575508587e-06, "loss": 0.4581, "step": 7498 }, { "epoch": 0.86, "learning_rate": 1.053176605504902e-06, "loss": 0.439, "step": 7499 }, { "epoch": 0.86, "learning_rate": 1.0515236793735007e-06, "loss": 0.4394, "step": 7500 }, { "epoch": 0.86, "learning_rate": 1.049871979383138e-06, "loss": 0.4437, "step": 7501 }, { "epoch": 0.86, "learning_rate": 1.0482215057601364e-06, "loss": 0.4593, "step": 7502 }, { "epoch": 0.86, "learning_rate": 1.0465722587306494e-06, "loss": 0.4444, "step": 7503 }, { "epoch": 0.86, "learning_rate": 1.044924238520657e-06, "loss": 0.4475, "step": 7504 }, { "epoch": 0.86, "learning_rate": 1.043277445355978e-06, "loss": 0.4565, "step": 7505 }, { "epoch": 0.86, "learning_rate": 1.0416318794622594e-06, "loss": 0.4562, "step": 7506 }, { "epoch": 0.86, "learning_rate": 1.0399875410649763e-06, "loss": 0.441, "step": 7507 }, { "epoch": 0.86, "learning_rate": 1.0383444303894453e-06, "loss": 0.4679, "step": 7508 }, { "epoch": 0.86, "learning_rate": 1.0367025476608038e-06, "loss": 0.4631, "step": 7509 }, { "epoch": 0.86, "learning_rate": 1.0350618931040324e-06, "loss": 0.4433, "step": 7510 }, { "epoch": 0.86, "learning_rate": 1.033422466943933e-06, "loss": 0.4734, "step": 7511 }, { "epoch": 0.86, "learning_rate": 1.031784269405144e-06, "loss": 0.4519, "step": 7512 }, { "epoch": 0.86, "learning_rate": 1.0301473007121376e-06, "loss": 0.4499, "step": 7513 }, { "epoch": 0.86, "learning_rate": 1.0285115610892138e-06, "loss": 0.4637, "step": 7514 }, { "epoch": 0.86, "learning_rate": 1.026877050760503e-06, "loss": 0.4271, "step": 7515 }, { "epoch": 0.86, "learning_rate": 1.025243769949974e-06, "loss": 0.4543, "step": 7516 }, { "epoch": 0.86, "learning_rate": 1.0236117188814187e-06, "loss": 0.4584, "step": 7517 }, { "epoch": 0.86, "learning_rate": 1.0219808977784673e-06, "loss": 0.4422, "step": 7518 }, { "epoch": 0.86, "learning_rate": 1.0203513068645788e-06, "loss": 0.4595, "step": 7519 }, { "epoch": 0.86, "learning_rate": 1.01872294636304e-06, "loss": 0.4512, "step": 7520 }, { "epoch": 0.86, "learning_rate": 1.0170958164969746e-06, "loss": 0.438, "step": 7521 }, { "epoch": 0.86, "learning_rate": 1.0154699174893367e-06, "loss": 0.4515, "step": 7522 }, { "epoch": 0.86, "learning_rate": 1.0138452495629125e-06, "loss": 0.4465, "step": 7523 }, { "epoch": 0.86, "learning_rate": 1.012221812940315e-06, "loss": 0.4385, "step": 7524 }, { "epoch": 0.86, "learning_rate": 1.0105996078439894e-06, "loss": 0.4496, "step": 7525 }, { "epoch": 0.86, "learning_rate": 1.0089786344962194e-06, "loss": 0.4472, "step": 7526 }, { "epoch": 0.86, "learning_rate": 1.0073588931191104e-06, "loss": 0.4485, "step": 7527 }, { "epoch": 0.86, "learning_rate": 1.0057403839346037e-06, "loss": 0.4544, "step": 7528 }, { "epoch": 0.86, "learning_rate": 1.004123107164472e-06, "loss": 0.4726, "step": 7529 }, { "epoch": 0.86, "learning_rate": 1.0025070630303168e-06, "loss": 0.4521, "step": 7530 }, { "epoch": 0.86, "learning_rate": 1.0008922517535747e-06, "loss": 0.4609, "step": 7531 }, { "epoch": 0.86, "learning_rate": 9.992786735555104e-07, "loss": 0.4313, "step": 7532 }, { "epoch": 0.86, "learning_rate": 9.976663286572176e-07, "loss": 0.4458, "step": 7533 }, { "epoch": 0.86, "learning_rate": 9.960552172796278e-07, "loss": 0.4657, "step": 7534 }, { "epoch": 0.86, "learning_rate": 9.94445339643495e-07, "loss": 0.435, "step": 7535 }, { "epoch": 0.86, "learning_rate": 9.928366959694113e-07, "loss": 0.4605, "step": 7536 }, { "epoch": 0.86, "learning_rate": 9.912292864777961e-07, "loss": 0.4526, "step": 7537 }, { "epoch": 0.86, "learning_rate": 9.896231113888988e-07, "loss": 0.468, "step": 7538 }, { "epoch": 0.86, "learning_rate": 9.880181709228032e-07, "loss": 0.4484, "step": 7539 }, { "epoch": 0.86, "learning_rate": 9.8641446529942e-07, "loss": 0.4639, "step": 7540 }, { "epoch": 0.86, "learning_rate": 9.848119947384937e-07, "loss": 0.4492, "step": 7541 }, { "epoch": 0.86, "learning_rate": 9.832107594596008e-07, "loss": 0.4683, "step": 7542 }, { "epoch": 0.86, "learning_rate": 9.81610759682141e-07, "loss": 0.4317, "step": 7543 }, { "epoch": 0.86, "learning_rate": 9.800119956253574e-07, "loss": 0.4468, "step": 7544 }, { "epoch": 0.86, "learning_rate": 9.784144675083107e-07, "loss": 0.4447, "step": 7545 }, { "epoch": 0.86, "learning_rate": 9.768181755498973e-07, "loss": 0.4756, "step": 7546 }, { "epoch": 0.86, "learning_rate": 9.7522311996885e-07, "loss": 0.4309, "step": 7547 }, { "epoch": 0.86, "learning_rate": 9.736293009837206e-07, "loss": 0.446, "step": 7548 }, { "epoch": 0.86, "learning_rate": 9.720367188129043e-07, "loss": 0.452, "step": 7549 }, { "epoch": 0.86, "learning_rate": 9.704453736746156e-07, "loss": 0.4351, "step": 7550 }, { "epoch": 0.86, "learning_rate": 9.688552657869055e-07, "loss": 0.4406, "step": 7551 }, { "epoch": 0.86, "learning_rate": 9.672663953676563e-07, "loss": 0.467, "step": 7552 }, { "epoch": 0.86, "learning_rate": 9.656787626345765e-07, "loss": 0.4444, "step": 7553 }, { "epoch": 0.86, "learning_rate": 9.640923678052094e-07, "loss": 0.4607, "step": 7554 }, { "epoch": 0.86, "learning_rate": 9.625072110969246e-07, "loss": 0.4649, "step": 7555 }, { "epoch": 0.86, "learning_rate": 9.60923292726923e-07, "loss": 0.4632, "step": 7556 }, { "epoch": 0.86, "learning_rate": 9.593406129122397e-07, "loss": 0.4489, "step": 7557 }, { "epoch": 0.86, "learning_rate": 9.577591718697343e-07, "loss": 0.4486, "step": 7558 }, { "epoch": 0.86, "learning_rate": 9.561789698161007e-07, "loss": 0.4312, "step": 7559 }, { "epoch": 0.86, "learning_rate": 9.54600006967864e-07, "loss": 0.4647, "step": 7560 }, { "epoch": 0.86, "learning_rate": 9.530222835413739e-07, "loss": 0.451, "step": 7561 }, { "epoch": 0.86, "learning_rate": 9.514457997528171e-07, "loss": 0.4704, "step": 7562 }, { "epoch": 0.86, "learning_rate": 9.498705558182053e-07, "loss": 0.4483, "step": 7563 }, { "epoch": 0.86, "learning_rate": 9.482965519533804e-07, "loss": 0.4656, "step": 7564 }, { "epoch": 0.86, "learning_rate": 9.467237883740199e-07, "loss": 0.4515, "step": 7565 }, { "epoch": 0.86, "learning_rate": 9.451522652956225e-07, "loss": 0.4385, "step": 7566 }, { "epoch": 0.86, "learning_rate": 9.435819829335269e-07, "loss": 0.4314, "step": 7567 }, { "epoch": 0.86, "learning_rate": 9.420129415028934e-07, "loss": 0.4629, "step": 7568 }, { "epoch": 0.87, "learning_rate": 9.404451412187166e-07, "loss": 0.4392, "step": 7569 }, { "epoch": 0.87, "learning_rate": 9.388785822958224e-07, "loss": 0.4575, "step": 7570 }, { "epoch": 0.87, "learning_rate": 9.373132649488636e-07, "loss": 0.4626, "step": 7571 }, { "epoch": 0.87, "learning_rate": 9.357491893923198e-07, "loss": 0.4594, "step": 7572 }, { "epoch": 0.87, "learning_rate": 9.341863558405084e-07, "loss": 0.4318, "step": 7573 }, { "epoch": 0.87, "learning_rate": 9.326247645075703e-07, "loss": 0.4612, "step": 7574 }, { "epoch": 0.87, "learning_rate": 9.310644156074811e-07, "loss": 0.4626, "step": 7575 }, { "epoch": 0.87, "learning_rate": 9.295053093540408e-07, "loss": 0.43, "step": 7576 }, { "epoch": 0.87, "learning_rate": 9.279474459608806e-07, "loss": 0.4374, "step": 7577 }, { "epoch": 0.87, "learning_rate": 9.263908256414656e-07, "loss": 0.4794, "step": 7578 }, { "epoch": 0.87, "learning_rate": 9.24835448609085e-07, "loss": 0.4464, "step": 7579 }, { "epoch": 0.87, "learning_rate": 9.23281315076865e-07, "loss": 0.4559, "step": 7580 }, { "epoch": 0.87, "learning_rate": 9.217284252577519e-07, "loss": 0.4274, "step": 7581 }, { "epoch": 0.87, "learning_rate": 9.201767793645255e-07, "loss": 0.4647, "step": 7582 }, { "epoch": 0.87, "learning_rate": 9.186263776098014e-07, "loss": 0.4514, "step": 7583 }, { "epoch": 0.87, "learning_rate": 9.170772202060141e-07, "loss": 0.4447, "step": 7584 }, { "epoch": 0.87, "learning_rate": 9.155293073654337e-07, "loss": 0.4388, "step": 7585 }, { "epoch": 0.87, "learning_rate": 9.139826393001617e-07, "loss": 0.452, "step": 7586 }, { "epoch": 0.87, "learning_rate": 9.124372162221217e-07, "loss": 0.4597, "step": 7587 }, { "epoch": 0.87, "learning_rate": 9.108930383430736e-07, "loss": 0.4609, "step": 7588 }, { "epoch": 0.87, "learning_rate": 9.093501058746057e-07, "loss": 0.4423, "step": 7589 }, { "epoch": 0.87, "learning_rate": 9.078084190281311e-07, "loss": 0.4459, "step": 7590 }, { "epoch": 0.87, "learning_rate": 9.062679780148987e-07, "loss": 0.4487, "step": 7591 }, { "epoch": 0.87, "learning_rate": 9.047287830459806e-07, "loss": 0.4524, "step": 7592 }, { "epoch": 0.87, "learning_rate": 9.031908343322826e-07, "loss": 0.449, "step": 7593 }, { "epoch": 0.87, "learning_rate": 9.016541320845373e-07, "loss": 0.4447, "step": 7594 }, { "epoch": 0.87, "learning_rate": 9.001186765133052e-07, "loss": 0.4528, "step": 7595 }, { "epoch": 0.87, "learning_rate": 8.985844678289823e-07, "loss": 0.4641, "step": 7596 }, { "epoch": 0.87, "learning_rate": 8.97051506241785e-07, "loss": 0.4672, "step": 7597 }, { "epoch": 0.87, "learning_rate": 8.955197919617653e-07, "loss": 0.4495, "step": 7598 }, { "epoch": 0.87, "learning_rate": 8.93989325198803e-07, "loss": 0.4568, "step": 7599 }, { "epoch": 0.87, "learning_rate": 8.924601061626049e-07, "loss": 0.4654, "step": 7600 }, { "epoch": 0.87, "learning_rate": 8.909321350627109e-07, "loss": 0.4634, "step": 7601 }, { "epoch": 0.87, "learning_rate": 8.894054121084839e-07, "loss": 0.4489, "step": 7602 }, { "epoch": 0.87, "learning_rate": 8.878799375091185e-07, "loss": 0.444, "step": 7603 }, { "epoch": 0.87, "learning_rate": 8.863557114736432e-07, "loss": 0.4585, "step": 7604 }, { "epoch": 0.87, "learning_rate": 8.848327342109053e-07, "loss": 0.4396, "step": 7605 }, { "epoch": 0.87, "learning_rate": 8.833110059295913e-07, "loss": 0.4655, "step": 7606 }, { "epoch": 0.87, "learning_rate": 8.817905268382088e-07, "loss": 0.4619, "step": 7607 }, { "epoch": 0.87, "learning_rate": 8.802712971450989e-07, "loss": 0.4306, "step": 7608 }, { "epoch": 0.87, "learning_rate": 8.787533170584317e-07, "loss": 0.4527, "step": 7609 }, { "epoch": 0.87, "learning_rate": 8.772365867862021e-07, "loss": 0.4511, "step": 7610 }, { "epoch": 0.87, "learning_rate": 8.757211065362359e-07, "loss": 0.4495, "step": 7611 }, { "epoch": 0.87, "learning_rate": 8.742068765161893e-07, "loss": 0.4779, "step": 7612 }, { "epoch": 0.87, "learning_rate": 8.726938969335419e-07, "loss": 0.4548, "step": 7613 }, { "epoch": 0.87, "learning_rate": 8.711821679956111e-07, "loss": 0.4472, "step": 7614 }, { "epoch": 0.87, "learning_rate": 8.696716899095336e-07, "loss": 0.4485, "step": 7615 }, { "epoch": 0.87, "learning_rate": 8.681624628822794e-07, "loss": 0.4791, "step": 7616 }, { "epoch": 0.87, "learning_rate": 8.666544871206484e-07, "loss": 0.4501, "step": 7617 }, { "epoch": 0.87, "learning_rate": 8.651477628312632e-07, "loss": 0.4501, "step": 7618 }, { "epoch": 0.87, "learning_rate": 8.636422902205821e-07, "loss": 0.4504, "step": 7619 }, { "epoch": 0.87, "learning_rate": 8.621380694948878e-07, "loss": 0.4417, "step": 7620 }, { "epoch": 0.87, "learning_rate": 8.606351008602898e-07, "loss": 0.4476, "step": 7621 }, { "epoch": 0.87, "learning_rate": 8.591333845227312e-07, "loss": 0.4568, "step": 7622 }, { "epoch": 0.87, "learning_rate": 8.576329206879785e-07, "loss": 0.4544, "step": 7623 }, { "epoch": 0.87, "learning_rate": 8.561337095616306e-07, "loss": 0.4428, "step": 7624 }, { "epoch": 0.87, "learning_rate": 8.54635751349111e-07, "loss": 0.4396, "step": 7625 }, { "epoch": 0.87, "learning_rate": 8.531390462556744e-07, "loss": 0.4423, "step": 7626 }, { "epoch": 0.87, "learning_rate": 8.516435944864043e-07, "loss": 0.4446, "step": 7627 }, { "epoch": 0.87, "learning_rate": 8.501493962462092e-07, "loss": 0.4541, "step": 7628 }, { "epoch": 0.87, "learning_rate": 8.486564517398265e-07, "loss": 0.4383, "step": 7629 }, { "epoch": 0.87, "learning_rate": 8.471647611718259e-07, "loss": 0.4603, "step": 7630 }, { "epoch": 0.87, "learning_rate": 8.456743247465992e-07, "loss": 0.4471, "step": 7631 }, { "epoch": 0.87, "learning_rate": 8.441851426683723e-07, "loss": 0.4791, "step": 7632 }, { "epoch": 0.87, "learning_rate": 8.426972151411961e-07, "loss": 0.4562, "step": 7633 }, { "epoch": 0.87, "learning_rate": 8.412105423689465e-07, "loss": 0.4443, "step": 7634 }, { "epoch": 0.87, "learning_rate": 8.397251245553339e-07, "loss": 0.4659, "step": 7635 }, { "epoch": 0.87, "learning_rate": 8.382409619038923e-07, "loss": 0.4401, "step": 7636 }, { "epoch": 0.87, "learning_rate": 8.367580546179877e-07, "loss": 0.4638, "step": 7637 }, { "epoch": 0.87, "learning_rate": 8.352764029008098e-07, "loss": 0.4554, "step": 7638 }, { "epoch": 0.87, "learning_rate": 8.337960069553763e-07, "loss": 0.4306, "step": 7639 }, { "epoch": 0.87, "learning_rate": 8.323168669845383e-07, "loss": 0.4672, "step": 7640 }, { "epoch": 0.87, "learning_rate": 8.30838983190968e-07, "loss": 0.453, "step": 7641 }, { "epoch": 0.87, "learning_rate": 8.29362355777168e-07, "loss": 0.4381, "step": 7642 }, { "epoch": 0.87, "learning_rate": 8.278869849454718e-07, "loss": 0.4571, "step": 7643 }, { "epoch": 0.87, "learning_rate": 8.264128708980345e-07, "loss": 0.4619, "step": 7644 }, { "epoch": 0.87, "learning_rate": 8.249400138368457e-07, "loss": 0.4437, "step": 7645 }, { "epoch": 0.87, "learning_rate": 8.234684139637205e-07, "loss": 0.4636, "step": 7646 }, { "epoch": 0.87, "learning_rate": 8.219980714802978e-07, "loss": 0.4432, "step": 7647 }, { "epoch": 0.87, "learning_rate": 8.205289865880505e-07, "loss": 0.4722, "step": 7648 }, { "epoch": 0.87, "learning_rate": 8.190611594882736e-07, "loss": 0.4393, "step": 7649 }, { "epoch": 0.87, "learning_rate": 8.175945903820937e-07, "loss": 0.4602, "step": 7650 }, { "epoch": 0.87, "learning_rate": 8.161292794704634e-07, "loss": 0.4411, "step": 7651 }, { "epoch": 0.87, "learning_rate": 8.146652269541599e-07, "loss": 0.458, "step": 7652 }, { "epoch": 0.87, "learning_rate": 8.132024330337962e-07, "loss": 0.4397, "step": 7653 }, { "epoch": 0.87, "learning_rate": 8.11740897909803e-07, "loss": 0.4447, "step": 7654 }, { "epoch": 0.87, "learning_rate": 8.102806217824455e-07, "loss": 0.4601, "step": 7655 }, { "epoch": 0.87, "learning_rate": 8.08821604851816e-07, "loss": 0.4818, "step": 7656 }, { "epoch": 0.88, "learning_rate": 8.073638473178291e-07, "loss": 0.4526, "step": 7657 }, { "epoch": 0.88, "learning_rate": 8.059073493802327e-07, "loss": 0.4646, "step": 7658 }, { "epoch": 0.88, "learning_rate": 8.044521112385983e-07, "loss": 0.4406, "step": 7659 }, { "epoch": 0.88, "learning_rate": 8.029981330923242e-07, "loss": 0.4413, "step": 7660 }, { "epoch": 0.88, "learning_rate": 8.01545415140641e-07, "loss": 0.4463, "step": 7661 }, { "epoch": 0.88, "learning_rate": 8.000939575826016e-07, "loss": 0.4578, "step": 7662 }, { "epoch": 0.88, "learning_rate": 7.986437606170893e-07, "loss": 0.4601, "step": 7663 }, { "epoch": 0.88, "learning_rate": 7.971948244428118e-07, "loss": 0.4446, "step": 7664 }, { "epoch": 0.88, "learning_rate": 7.957471492583068e-07, "loss": 0.4322, "step": 7665 }, { "epoch": 0.88, "learning_rate": 7.943007352619392e-07, "loss": 0.4489, "step": 7666 }, { "epoch": 0.88, "learning_rate": 7.928555826518991e-07, "loss": 0.4336, "step": 7667 }, { "epoch": 0.88, "learning_rate": 7.914116916262027e-07, "loss": 0.4407, "step": 7668 }, { "epoch": 0.88, "learning_rate": 7.899690623826983e-07, "loss": 0.4515, "step": 7669 }, { "epoch": 0.88, "learning_rate": 7.885276951190568e-07, "loss": 0.4516, "step": 7670 }, { "epoch": 0.88, "learning_rate": 7.870875900327779e-07, "loss": 0.4426, "step": 7671 }, { "epoch": 0.88, "learning_rate": 7.856487473211871e-07, "loss": 0.4682, "step": 7672 }, { "epoch": 0.88, "learning_rate": 7.842111671814401e-07, "loss": 0.4245, "step": 7673 }, { "epoch": 0.88, "learning_rate": 7.82774849810517e-07, "loss": 0.4563, "step": 7674 }, { "epoch": 0.88, "learning_rate": 7.813397954052237e-07, "loss": 0.4313, "step": 7675 }, { "epoch": 0.88, "learning_rate": 7.799060041621975e-07, "loss": 0.449, "step": 7676 }, { "epoch": 0.88, "learning_rate": 7.784734762778978e-07, "loss": 0.4433, "step": 7677 }, { "epoch": 0.88, "learning_rate": 7.77042211948611e-07, "loss": 0.438, "step": 7678 }, { "epoch": 0.88, "learning_rate": 7.756122113704567e-07, "loss": 0.4465, "step": 7679 }, { "epoch": 0.88, "learning_rate": 7.741834747393751e-07, "loss": 0.4503, "step": 7680 }, { "epoch": 0.88, "learning_rate": 7.727560022511327e-07, "loss": 0.4502, "step": 7681 }, { "epoch": 0.88, "learning_rate": 7.713297941013264e-07, "loss": 0.455, "step": 7682 }, { "epoch": 0.88, "learning_rate": 7.69904850485379e-07, "loss": 0.4359, "step": 7683 }, { "epoch": 0.88, "learning_rate": 7.684811715985429e-07, "loss": 0.4722, "step": 7684 }, { "epoch": 0.88, "learning_rate": 7.670587576358889e-07, "loss": 0.4377, "step": 7685 }, { "epoch": 0.88, "learning_rate": 7.656376087923212e-07, "loss": 0.4555, "step": 7686 }, { "epoch": 0.88, "learning_rate": 7.642177252625704e-07, "loss": 0.4569, "step": 7687 }, { "epoch": 0.88, "learning_rate": 7.627991072411889e-07, "loss": 0.4471, "step": 7688 }, { "epoch": 0.88, "learning_rate": 7.613817549225621e-07, "loss": 0.4646, "step": 7689 }, { "epoch": 0.88, "learning_rate": 7.599656685008982e-07, "loss": 0.4708, "step": 7690 }, { "epoch": 0.88, "learning_rate": 7.585508481702308e-07, "loss": 0.4315, "step": 7691 }, { "epoch": 0.88, "learning_rate": 7.571372941244237e-07, "loss": 0.4523, "step": 7692 }, { "epoch": 0.88, "learning_rate": 7.557250065571664e-07, "loss": 0.435, "step": 7693 }, { "epoch": 0.88, "learning_rate": 7.543139856619708e-07, "loss": 0.4433, "step": 7694 }, { "epoch": 0.88, "learning_rate": 7.52904231632181e-07, "loss": 0.4802, "step": 7695 }, { "epoch": 0.88, "learning_rate": 7.514957446609627e-07, "loss": 0.4475, "step": 7696 }, { "epoch": 0.88, "learning_rate": 7.500885249413126e-07, "loss": 0.469, "step": 7697 }, { "epoch": 0.88, "learning_rate": 7.486825726660496e-07, "loss": 0.4423, "step": 7698 }, { "epoch": 0.88, "learning_rate": 7.472778880278197e-07, "loss": 0.4658, "step": 7699 }, { "epoch": 0.88, "learning_rate": 7.45874471219098e-07, "loss": 0.4586, "step": 7700 }, { "epoch": 0.88, "learning_rate": 7.444723224321804e-07, "loss": 0.4538, "step": 7701 }, { "epoch": 0.88, "learning_rate": 7.430714418591966e-07, "loss": 0.4298, "step": 7702 }, { "epoch": 0.88, "learning_rate": 7.416718296920977e-07, "loss": 0.4549, "step": 7703 }, { "epoch": 0.88, "learning_rate": 7.40273486122659e-07, "loss": 0.438, "step": 7704 }, { "epoch": 0.88, "learning_rate": 7.388764113424895e-07, "loss": 0.4753, "step": 7705 }, { "epoch": 0.88, "learning_rate": 7.37480605543015e-07, "loss": 0.4512, "step": 7706 }, { "epoch": 0.88, "learning_rate": 7.360860689154969e-07, "loss": 0.4467, "step": 7707 }, { "epoch": 0.88, "learning_rate": 7.346928016510135e-07, "loss": 0.438, "step": 7708 }, { "epoch": 0.88, "learning_rate": 7.333008039404743e-07, "loss": 0.4606, "step": 7709 }, { "epoch": 0.88, "learning_rate": 7.319100759746167e-07, "loss": 0.4459, "step": 7710 }, { "epoch": 0.88, "learning_rate": 7.305206179439972e-07, "loss": 0.4351, "step": 7711 }, { "epoch": 0.88, "learning_rate": 7.291324300390057e-07, "loss": 0.46, "step": 7712 }, { "epoch": 0.88, "learning_rate": 7.277455124498545e-07, "loss": 0.4704, "step": 7713 }, { "epoch": 0.88, "learning_rate": 7.263598653665815e-07, "loss": 0.4559, "step": 7714 }, { "epoch": 0.88, "learning_rate": 7.249754889790539e-07, "loss": 0.4432, "step": 7715 }, { "epoch": 0.88, "learning_rate": 7.235923834769599e-07, "loss": 0.4376, "step": 7716 }, { "epoch": 0.88, "learning_rate": 7.222105490498133e-07, "loss": 0.4602, "step": 7717 }, { "epoch": 0.88, "learning_rate": 7.208299858869616e-07, "loss": 0.449, "step": 7718 }, { "epoch": 0.88, "learning_rate": 7.194506941775681e-07, "loss": 0.4414, "step": 7719 }, { "epoch": 0.88, "learning_rate": 7.180726741106303e-07, "loss": 0.4416, "step": 7720 }, { "epoch": 0.88, "learning_rate": 7.16695925874964e-07, "loss": 0.4513, "step": 7721 }, { "epoch": 0.88, "learning_rate": 7.15320449659217e-07, "loss": 0.4673, "step": 7722 }, { "epoch": 0.88, "learning_rate": 7.139462456518619e-07, "loss": 0.4606, "step": 7723 }, { "epoch": 0.88, "learning_rate": 7.125733140411928e-07, "loss": 0.4422, "step": 7724 }, { "epoch": 0.88, "learning_rate": 7.1120165501533e-07, "loss": 0.45, "step": 7725 }, { "epoch": 0.88, "learning_rate": 7.098312687622256e-07, "loss": 0.4541, "step": 7726 }, { "epoch": 0.88, "learning_rate": 7.084621554696502e-07, "loss": 0.4516, "step": 7727 }, { "epoch": 0.88, "learning_rate": 7.070943153252053e-07, "loss": 0.4362, "step": 7728 }, { "epoch": 0.88, "learning_rate": 7.057277485163116e-07, "loss": 0.4724, "step": 7729 }, { "epoch": 0.88, "learning_rate": 7.043624552302231e-07, "loss": 0.4389, "step": 7730 }, { "epoch": 0.88, "learning_rate": 7.029984356540153e-07, "loss": 0.4602, "step": 7731 }, { "epoch": 0.88, "learning_rate": 7.016356899745869e-07, "loss": 0.4498, "step": 7732 }, { "epoch": 0.88, "learning_rate": 7.002742183786671e-07, "loss": 0.4505, "step": 7733 }, { "epoch": 0.88, "learning_rate": 6.989140210528067e-07, "loss": 0.4436, "step": 7734 }, { "epoch": 0.88, "learning_rate": 6.975550981833823e-07, "loss": 0.4532, "step": 7735 }, { "epoch": 0.88, "learning_rate": 6.961974499565982e-07, "loss": 0.4534, "step": 7736 }, { "epoch": 0.88, "learning_rate": 6.948410765584813e-07, "loss": 0.4557, "step": 7737 }, { "epoch": 0.88, "learning_rate": 6.934859781748848e-07, "loss": 0.4727, "step": 7738 }, { "epoch": 0.88, "learning_rate": 6.921321549914872e-07, "loss": 0.4457, "step": 7739 }, { "epoch": 0.88, "learning_rate": 6.907796071937944e-07, "loss": 0.4459, "step": 7740 }, { "epoch": 0.88, "learning_rate": 6.894283349671349e-07, "loss": 0.4443, "step": 7741 }, { "epoch": 0.88, "learning_rate": 6.880783384966638e-07, "loss": 0.4602, "step": 7742 }, { "epoch": 0.88, "learning_rate": 6.867296179673588e-07, "loss": 0.4401, "step": 7743 }, { "epoch": 0.89, "learning_rate": 6.853821735640265e-07, "loss": 0.438, "step": 7744 }, { "epoch": 0.89, "learning_rate": 6.840360054712946e-07, "loss": 0.4418, "step": 7745 }, { "epoch": 0.89, "learning_rate": 6.826911138736214e-07, "loss": 0.4423, "step": 7746 }, { "epoch": 0.89, "learning_rate": 6.81347498955286e-07, "loss": 0.461, "step": 7747 }, { "epoch": 0.89, "learning_rate": 6.800051609003911e-07, "loss": 0.4588, "step": 7748 }, { "epoch": 0.89, "learning_rate": 6.786640998928684e-07, "loss": 0.457, "step": 7749 }, { "epoch": 0.89, "learning_rate": 6.773243161164756e-07, "loss": 0.4321, "step": 7750 }, { "epoch": 0.89, "learning_rate": 6.7598580975479e-07, "loss": 0.4422, "step": 7751 }, { "epoch": 0.89, "learning_rate": 6.746485809912184e-07, "loss": 0.4472, "step": 7752 }, { "epoch": 0.89, "learning_rate": 6.733126300089898e-07, "loss": 0.4487, "step": 7753 }, { "epoch": 0.89, "learning_rate": 6.719779569911622e-07, "loss": 0.4533, "step": 7754 }, { "epoch": 0.89, "learning_rate": 6.706445621206126e-07, "loss": 0.4623, "step": 7755 }, { "epoch": 0.89, "learning_rate": 6.69312445580046e-07, "loss": 0.4483, "step": 7756 }, { "epoch": 0.89, "learning_rate": 6.67981607551994e-07, "loss": 0.4525, "step": 7757 }, { "epoch": 0.89, "learning_rate": 6.666520482188087e-07, "loss": 0.4394, "step": 7758 }, { "epoch": 0.89, "learning_rate": 6.653237677626701e-07, "loss": 0.458, "step": 7759 }, { "epoch": 0.89, "learning_rate": 6.639967663655844e-07, "loss": 0.4302, "step": 7760 }, { "epoch": 0.89, "learning_rate": 6.626710442093776e-07, "loss": 0.4385, "step": 7761 }, { "epoch": 0.89, "learning_rate": 6.613466014757064e-07, "loss": 0.4548, "step": 7762 }, { "epoch": 0.89, "learning_rate": 6.600234383460469e-07, "loss": 0.4378, "step": 7763 }, { "epoch": 0.89, "learning_rate": 6.587015550017006e-07, "loss": 0.431, "step": 7764 }, { "epoch": 0.89, "learning_rate": 6.573809516237984e-07, "loss": 0.4637, "step": 7765 }, { "epoch": 0.89, "learning_rate": 6.560616283932897e-07, "loss": 0.4629, "step": 7766 }, { "epoch": 0.89, "learning_rate": 6.547435854909534e-07, "loss": 0.4502, "step": 7767 }, { "epoch": 0.89, "learning_rate": 6.534268230973873e-07, "loss": 0.4431, "step": 7768 }, { "epoch": 0.89, "learning_rate": 6.521113413930202e-07, "loss": 0.452, "step": 7769 }, { "epoch": 0.89, "learning_rate": 6.507971405581037e-07, "loss": 0.4402, "step": 7770 }, { "epoch": 0.89, "learning_rate": 6.494842207727092e-07, "loss": 0.4589, "step": 7771 }, { "epoch": 0.89, "learning_rate": 6.481725822167384e-07, "loss": 0.446, "step": 7772 }, { "epoch": 0.89, "learning_rate": 6.468622250699152e-07, "loss": 0.4478, "step": 7773 }, { "epoch": 0.89, "learning_rate": 6.45553149511785e-07, "loss": 0.4533, "step": 7774 }, { "epoch": 0.89, "learning_rate": 6.442453557217243e-07, "loss": 0.4651, "step": 7775 }, { "epoch": 0.89, "learning_rate": 6.429388438789252e-07, "loss": 0.4491, "step": 7776 }, { "epoch": 0.89, "learning_rate": 6.416336141624146e-07, "loss": 0.4507, "step": 7777 }, { "epoch": 0.89, "learning_rate": 6.403296667510339e-07, "loss": 0.4598, "step": 7778 }, { "epoch": 0.89, "learning_rate": 6.390270018234534e-07, "loss": 0.4574, "step": 7779 }, { "epoch": 0.89, "learning_rate": 6.377256195581705e-07, "loss": 0.4618, "step": 7780 }, { "epoch": 0.89, "learning_rate": 6.364255201335013e-07, "loss": 0.4581, "step": 7781 }, { "epoch": 0.89, "learning_rate": 6.351267037275877e-07, "loss": 0.4482, "step": 7782 }, { "epoch": 0.89, "learning_rate": 6.338291705183986e-07, "loss": 0.4528, "step": 7783 }, { "epoch": 0.89, "learning_rate": 6.325329206837217e-07, "loss": 0.463, "step": 7784 }, { "epoch": 0.89, "learning_rate": 6.31237954401176e-07, "loss": 0.4425, "step": 7785 }, { "epoch": 0.89, "learning_rate": 6.299442718481974e-07, "loss": 0.4418, "step": 7786 }, { "epoch": 0.89, "learning_rate": 6.286518732020519e-07, "loss": 0.4509, "step": 7787 }, { "epoch": 0.89, "learning_rate": 6.273607586398267e-07, "loss": 0.4507, "step": 7788 }, { "epoch": 0.89, "learning_rate": 6.260709283384326e-07, "loss": 0.4678, "step": 7789 }, { "epoch": 0.89, "learning_rate": 6.247823824746058e-07, "loss": 0.4374, "step": 7790 }, { "epoch": 0.89, "learning_rate": 6.234951212249052e-07, "loss": 0.4768, "step": 7791 }, { "epoch": 0.89, "learning_rate": 6.222091447657119e-07, "loss": 0.4333, "step": 7792 }, { "epoch": 0.89, "learning_rate": 6.209244532732394e-07, "loss": 0.4462, "step": 7793 }, { "epoch": 0.89, "learning_rate": 6.196410469235148e-07, "loss": 0.4515, "step": 7794 }, { "epoch": 0.89, "learning_rate": 6.183589258923928e-07, "loss": 0.4577, "step": 7795 }, { "epoch": 0.89, "learning_rate": 6.170780903555529e-07, "loss": 0.4478, "step": 7796 }, { "epoch": 0.89, "learning_rate": 6.157985404885003e-07, "loss": 0.4433, "step": 7797 }, { "epoch": 0.89, "learning_rate": 6.145202764665626e-07, "loss": 0.4634, "step": 7798 }, { "epoch": 0.89, "learning_rate": 6.132432984648895e-07, "loss": 0.4328, "step": 7799 }, { "epoch": 0.89, "learning_rate": 6.119676066584523e-07, "loss": 0.4386, "step": 7800 }, { "epoch": 0.89, "learning_rate": 6.106932012220534e-07, "loss": 0.4653, "step": 7801 }, { "epoch": 0.89, "learning_rate": 6.09420082330312e-07, "loss": 0.4458, "step": 7802 }, { "epoch": 0.89, "learning_rate": 6.081482501576763e-07, "loss": 0.4492, "step": 7803 }, { "epoch": 0.89, "learning_rate": 6.068777048784136e-07, "loss": 0.4465, "step": 7804 }, { "epoch": 0.89, "learning_rate": 6.056084466666167e-07, "loss": 0.4539, "step": 7805 }, { "epoch": 0.89, "learning_rate": 6.043404756962046e-07, "loss": 0.4583, "step": 7806 }, { "epoch": 0.89, "learning_rate": 6.030737921409169e-07, "loss": 0.4634, "step": 7807 }, { "epoch": 0.89, "learning_rate": 6.01808396174316e-07, "loss": 0.4564, "step": 7808 }, { "epoch": 0.89, "learning_rate": 6.005442879697909e-07, "loss": 0.4556, "step": 7809 }, { "epoch": 0.89, "learning_rate": 5.992814677005521e-07, "loss": 0.4375, "step": 7810 }, { "epoch": 0.89, "learning_rate": 5.980199355396343e-07, "loss": 0.4505, "step": 7811 }, { "epoch": 0.89, "learning_rate": 5.967596916598961e-07, "loss": 0.4443, "step": 7812 }, { "epoch": 0.89, "learning_rate": 5.955007362340171e-07, "loss": 0.4439, "step": 7813 }, { "epoch": 0.89, "learning_rate": 5.942430694345058e-07, "loss": 0.4427, "step": 7814 }, { "epoch": 0.89, "learning_rate": 5.929866914336857e-07, "loss": 0.4509, "step": 7815 }, { "epoch": 0.89, "learning_rate": 5.917316024037123e-07, "loss": 0.4467, "step": 7816 }, { "epoch": 0.89, "learning_rate": 5.904778025165614e-07, "loss": 0.4594, "step": 7817 }, { "epoch": 0.89, "learning_rate": 5.892252919440289e-07, "loss": 0.4512, "step": 7818 }, { "epoch": 0.89, "learning_rate": 5.879740708577386e-07, "loss": 0.4463, "step": 7819 }, { "epoch": 0.89, "learning_rate": 5.867241394291356e-07, "loss": 0.4634, "step": 7820 }, { "epoch": 0.89, "learning_rate": 5.854754978294863e-07, "loss": 0.4553, "step": 7821 }, { "epoch": 0.89, "learning_rate": 5.84228146229886e-07, "loss": 0.444, "step": 7822 }, { "epoch": 0.89, "learning_rate": 5.829820848012457e-07, "loss": 0.4574, "step": 7823 }, { "epoch": 0.89, "learning_rate": 5.817373137143079e-07, "loss": 0.4532, "step": 7824 }, { "epoch": 0.89, "learning_rate": 5.804938331396292e-07, "loss": 0.4523, "step": 7825 }, { "epoch": 0.89, "learning_rate": 5.79251643247598e-07, "loss": 0.4373, "step": 7826 }, { "epoch": 0.89, "learning_rate": 5.780107442084215e-07, "loss": 0.4631, "step": 7827 }, { "epoch": 0.89, "learning_rate": 5.767711361921291e-07, "loss": 0.4318, "step": 7828 }, { "epoch": 0.89, "learning_rate": 5.755328193685772e-07, "loss": 0.4593, "step": 7829 }, { "epoch": 0.89, "learning_rate": 5.742957939074412e-07, "loss": 0.4494, "step": 7830 }, { "epoch": 0.89, "learning_rate": 5.730600599782188e-07, "loss": 0.4487, "step": 7831 }, { "epoch": 0.9, "learning_rate": 5.718256177502379e-07, "loss": 0.4477, "step": 7832 }, { "epoch": 0.9, "learning_rate": 5.70592467392641e-07, "loss": 0.4551, "step": 7833 }, { "epoch": 0.9, "learning_rate": 5.693606090744008e-07, "loss": 0.4259, "step": 7834 }, { "epoch": 0.9, "learning_rate": 5.681300429643044e-07, "loss": 0.4667, "step": 7835 }, { "epoch": 0.9, "learning_rate": 5.669007692309703e-07, "loss": 0.4529, "step": 7836 }, { "epoch": 0.9, "learning_rate": 5.65672788042837e-07, "loss": 0.4611, "step": 7837 }, { "epoch": 0.9, "learning_rate": 5.644460995681644e-07, "loss": 0.4351, "step": 7838 }, { "epoch": 0.9, "learning_rate": 5.632207039750348e-07, "loss": 0.4465, "step": 7839 }, { "epoch": 0.9, "learning_rate": 5.61996601431356e-07, "loss": 0.463, "step": 7840 }, { "epoch": 0.9, "learning_rate": 5.607737921048573e-07, "loss": 0.4737, "step": 7841 }, { "epoch": 0.9, "learning_rate": 5.595522761630911e-07, "loss": 0.4388, "step": 7842 }, { "epoch": 0.9, "learning_rate": 5.583320537734315e-07, "loss": 0.455, "step": 7843 }, { "epoch": 0.9, "learning_rate": 5.57113125103077e-07, "loss": 0.4427, "step": 7844 }, { "epoch": 0.9, "learning_rate": 5.558954903190483e-07, "loss": 0.4489, "step": 7845 }, { "epoch": 0.9, "learning_rate": 5.546791495881887e-07, "loss": 0.4557, "step": 7846 }, { "epoch": 0.9, "learning_rate": 5.534641030771615e-07, "loss": 0.4598, "step": 7847 }, { "epoch": 0.9, "learning_rate": 5.522503509524591e-07, "loss": 0.4401, "step": 7848 }, { "epoch": 0.9, "learning_rate": 5.510378933803895e-07, "loss": 0.4515, "step": 7849 }, { "epoch": 0.9, "learning_rate": 5.498267305270888e-07, "loss": 0.4423, "step": 7850 }, { "epoch": 0.9, "learning_rate": 5.48616862558512e-07, "loss": 0.4442, "step": 7851 }, { "epoch": 0.9, "learning_rate": 5.474082896404365e-07, "loss": 0.4525, "step": 7852 }, { "epoch": 0.9, "learning_rate": 5.462010119384665e-07, "loss": 0.4448, "step": 7853 }, { "epoch": 0.9, "learning_rate": 5.44995029618024e-07, "loss": 0.4257, "step": 7854 }, { "epoch": 0.9, "learning_rate": 5.43790342844358e-07, "loss": 0.4738, "step": 7855 }, { "epoch": 0.9, "learning_rate": 5.425869517825366e-07, "loss": 0.4501, "step": 7856 }, { "epoch": 0.9, "learning_rate": 5.413848565974489e-07, "loss": 0.4749, "step": 7857 }, { "epoch": 0.9, "learning_rate": 5.401840574538108e-07, "loss": 0.4564, "step": 7858 }, { "epoch": 0.9, "learning_rate": 5.389845545161598e-07, "loss": 0.4435, "step": 7859 }, { "epoch": 0.9, "learning_rate": 5.37786347948851e-07, "loss": 0.4443, "step": 7860 }, { "epoch": 0.9, "learning_rate": 5.365894379160686e-07, "loss": 0.4699, "step": 7861 }, { "epoch": 0.9, "learning_rate": 5.353938245818147e-07, "loss": 0.4474, "step": 7862 }, { "epoch": 0.9, "learning_rate": 5.341995081099139e-07, "loss": 0.4651, "step": 7863 }, { "epoch": 0.9, "learning_rate": 5.330064886640173e-07, "loss": 0.4474, "step": 7864 }, { "epoch": 0.9, "learning_rate": 5.318147664075923e-07, "loss": 0.4703, "step": 7865 }, { "epoch": 0.9, "learning_rate": 5.306243415039336e-07, "loss": 0.452, "step": 7866 }, { "epoch": 0.9, "learning_rate": 5.294352141161541e-07, "loss": 0.4484, "step": 7867 }, { "epoch": 0.9, "learning_rate": 5.282473844071933e-07, "loss": 0.4377, "step": 7868 }, { "epoch": 0.9, "learning_rate": 5.27060852539808e-07, "loss": 0.4763, "step": 7869 }, { "epoch": 0.9, "learning_rate": 5.258756186765801e-07, "loss": 0.4567, "step": 7870 }, { "epoch": 0.9, "learning_rate": 5.246916829799132e-07, "loss": 0.4356, "step": 7871 }, { "epoch": 0.9, "learning_rate": 5.235090456120329e-07, "loss": 0.4509, "step": 7872 }, { "epoch": 0.9, "learning_rate": 5.223277067349864e-07, "loss": 0.4649, "step": 7873 }, { "epoch": 0.9, "learning_rate": 5.211476665106463e-07, "loss": 0.4489, "step": 7874 }, { "epoch": 0.9, "learning_rate": 5.199689251007001e-07, "loss": 0.4553, "step": 7875 }, { "epoch": 0.9, "learning_rate": 5.187914826666662e-07, "loss": 0.4444, "step": 7876 }, { "epoch": 0.9, "learning_rate": 5.17615339369878e-07, "loss": 0.4496, "step": 7877 }, { "epoch": 0.9, "learning_rate": 5.164404953714919e-07, "loss": 0.4492, "step": 7878 }, { "epoch": 0.9, "learning_rate": 5.152669508324904e-07, "loss": 0.4534, "step": 7879 }, { "epoch": 0.9, "learning_rate": 5.140947059136736e-07, "loss": 0.4503, "step": 7880 }, { "epoch": 0.9, "learning_rate": 5.129237607756677e-07, "loss": 0.4529, "step": 7881 }, { "epoch": 0.9, "learning_rate": 5.117541155789141e-07, "loss": 0.4364, "step": 7882 }, { "epoch": 0.9, "learning_rate": 5.105857704836836e-07, "loss": 0.4399, "step": 7883 }, { "epoch": 0.9, "learning_rate": 5.094187256500671e-07, "loss": 0.4533, "step": 7884 }, { "epoch": 0.9, "learning_rate": 5.08252981237971e-07, "loss": 0.4392, "step": 7885 }, { "epoch": 0.9, "learning_rate": 5.070885374071321e-07, "loss": 0.4464, "step": 7886 }, { "epoch": 0.9, "learning_rate": 5.05925394317105e-07, "loss": 0.4763, "step": 7887 }, { "epoch": 0.9, "learning_rate": 5.047635521272631e-07, "loss": 0.4511, "step": 7888 }, { "epoch": 0.9, "learning_rate": 5.036030109968082e-07, "loss": 0.456, "step": 7889 }, { "epoch": 0.9, "learning_rate": 5.024437710847574e-07, "loss": 0.4665, "step": 7890 }, { "epoch": 0.9, "learning_rate": 5.012858325499559e-07, "loss": 0.4364, "step": 7891 }, { "epoch": 0.9, "learning_rate": 5.001291955510634e-07, "loss": 0.4645, "step": 7892 }, { "epoch": 0.9, "learning_rate": 4.989738602465666e-07, "loss": 0.4316, "step": 7893 }, { "epoch": 0.9, "learning_rate": 4.978198267947742e-07, "loss": 0.4545, "step": 7894 }, { "epoch": 0.9, "learning_rate": 4.966670953538133e-07, "loss": 0.4539, "step": 7895 }, { "epoch": 0.9, "learning_rate": 4.955156660816307e-07, "loss": 0.454, "step": 7896 }, { "epoch": 0.9, "learning_rate": 4.943655391360025e-07, "loss": 0.4422, "step": 7897 }, { "epoch": 0.9, "learning_rate": 4.932167146745193e-07, "loss": 0.4376, "step": 7898 }, { "epoch": 0.9, "learning_rate": 4.920691928545973e-07, "loss": 0.456, "step": 7899 }, { "epoch": 0.9, "learning_rate": 4.909229738334698e-07, "loss": 0.4591, "step": 7900 }, { "epoch": 0.9, "learning_rate": 4.897780577681954e-07, "loss": 0.4428, "step": 7901 }, { "epoch": 0.9, "learning_rate": 4.886344448156566e-07, "loss": 0.4412, "step": 7902 }, { "epoch": 0.9, "learning_rate": 4.874921351325512e-07, "loss": 0.4327, "step": 7903 }, { "epoch": 0.9, "learning_rate": 4.863511288753986e-07, "loss": 0.4401, "step": 7904 }, { "epoch": 0.9, "learning_rate": 4.85211426200547e-07, "loss": 0.4561, "step": 7905 }, { "epoch": 0.9, "learning_rate": 4.840730272641569e-07, "loss": 0.4616, "step": 7906 }, { "epoch": 0.9, "learning_rate": 4.829359322222182e-07, "loss": 0.4657, "step": 7907 }, { "epoch": 0.9, "learning_rate": 4.818001412305362e-07, "loss": 0.4471, "step": 7908 }, { "epoch": 0.9, "learning_rate": 4.806656544447374e-07, "loss": 0.4503, "step": 7909 }, { "epoch": 0.9, "learning_rate": 4.795324720202754e-07, "loss": 0.4521, "step": 7910 }, { "epoch": 0.9, "learning_rate": 4.784005941124203e-07, "loss": 0.4485, "step": 7911 }, { "epoch": 0.9, "learning_rate": 4.772700208762659e-07, "loss": 0.4421, "step": 7912 }, { "epoch": 0.9, "learning_rate": 4.761407524667239e-07, "loss": 0.4397, "step": 7913 }, { "epoch": 0.9, "learning_rate": 4.750127890385292e-07, "loss": 0.4493, "step": 7914 }, { "epoch": 0.9, "learning_rate": 4.738861307462406e-07, "loss": 0.461, "step": 7915 }, { "epoch": 0.9, "learning_rate": 4.7276077774423334e-07, "loss": 0.4571, "step": 7916 }, { "epoch": 0.9, "learning_rate": 4.716367301867053e-07, "loss": 0.4409, "step": 7917 }, { "epoch": 0.9, "learning_rate": 4.705139882276788e-07, "loss": 0.4698, "step": 7918 }, { "epoch": 0.91, "learning_rate": 4.693925520209908e-07, "loss": 0.4495, "step": 7919 }, { "epoch": 0.91, "learning_rate": 4.6827242172030495e-07, "loss": 0.4517, "step": 7920 }, { "epoch": 0.91, "learning_rate": 4.6715359747910526e-07, "loss": 0.4549, "step": 7921 }, { "epoch": 0.91, "learning_rate": 4.660360794506946e-07, "loss": 0.4327, "step": 7922 }, { "epoch": 0.91, "learning_rate": 4.649198677881983e-07, "loss": 0.4543, "step": 7923 }, { "epoch": 0.91, "learning_rate": 4.6380496264456064e-07, "loss": 0.4555, "step": 7924 }, { "epoch": 0.91, "learning_rate": 4.6269136417255167e-07, "loss": 0.433, "step": 7925 }, { "epoch": 0.91, "learning_rate": 4.615790725247571e-07, "loss": 0.4415, "step": 7926 }, { "epoch": 0.91, "learning_rate": 4.60468087853585e-07, "loss": 0.44, "step": 7927 }, { "epoch": 0.91, "learning_rate": 4.5935841031126693e-07, "loss": 0.4495, "step": 7928 }, { "epoch": 0.91, "learning_rate": 4.582500400498513e-07, "loss": 0.4418, "step": 7929 }, { "epoch": 0.91, "learning_rate": 4.5714297722121105e-07, "loss": 0.458, "step": 7930 }, { "epoch": 0.91, "learning_rate": 4.5603722197703925e-07, "loss": 0.4415, "step": 7931 }, { "epoch": 0.91, "learning_rate": 4.54932774468847e-07, "loss": 0.4602, "step": 7932 }, { "epoch": 0.91, "learning_rate": 4.5382963484797096e-07, "loss": 0.4578, "step": 7933 }, { "epoch": 0.91, "learning_rate": 4.5272780326556466e-07, "loss": 0.469, "step": 7934 }, { "epoch": 0.91, "learning_rate": 4.516272798726018e-07, "loss": 0.4415, "step": 7935 }, { "epoch": 0.91, "learning_rate": 4.5052806481988175e-07, "loss": 0.4508, "step": 7936 }, { "epoch": 0.91, "learning_rate": 4.494301582580185e-07, "loss": 0.4495, "step": 7937 }, { "epoch": 0.91, "learning_rate": 4.4833356033745167e-07, "loss": 0.4321, "step": 7938 }, { "epoch": 0.91, "learning_rate": 4.472382712084389e-07, "loss": 0.4402, "step": 7939 }, { "epoch": 0.91, "learning_rate": 4.4614429102105893e-07, "loss": 0.441, "step": 7940 }, { "epoch": 0.91, "learning_rate": 4.4505161992521417e-07, "loss": 0.4518, "step": 7941 }, { "epoch": 0.91, "learning_rate": 4.439602580706226e-07, "loss": 0.4709, "step": 7942 }, { "epoch": 0.91, "learning_rate": 4.4287020560682345e-07, "loss": 0.4147, "step": 7943 }, { "epoch": 0.91, "learning_rate": 4.4178146268318177e-07, "loss": 0.4517, "step": 7944 }, { "epoch": 0.91, "learning_rate": 4.406940294488771e-07, "loss": 0.4611, "step": 7945 }, { "epoch": 0.91, "learning_rate": 4.396079060529146e-07, "loss": 0.4488, "step": 7946 }, { "epoch": 0.91, "learning_rate": 4.3852309264411417e-07, "loss": 0.434, "step": 7947 }, { "epoch": 0.91, "learning_rate": 4.3743958937112253e-07, "loss": 0.4538, "step": 7948 }, { "epoch": 0.91, "learning_rate": 4.363573963824008e-07, "loss": 0.4536, "step": 7949 }, { "epoch": 0.91, "learning_rate": 4.3527651382623603e-07, "loss": 0.4758, "step": 7950 }, { "epoch": 0.91, "learning_rate": 4.3419694185073303e-07, "loss": 0.449, "step": 7951 }, { "epoch": 0.91, "learning_rate": 4.331186806038179e-07, "loss": 0.4611, "step": 7952 }, { "epoch": 0.91, "learning_rate": 4.320417302332325e-07, "loss": 0.4398, "step": 7953 }, { "epoch": 0.91, "learning_rate": 4.3096609088654873e-07, "loss": 0.4411, "step": 7954 }, { "epoch": 0.91, "learning_rate": 4.298917627111476e-07, "loss": 0.4262, "step": 7955 }, { "epoch": 0.91, "learning_rate": 4.2881874585424146e-07, "loss": 0.4694, "step": 7956 }, { "epoch": 0.91, "learning_rate": 4.2774704046285254e-07, "loss": 0.4418, "step": 7957 }, { "epoch": 0.91, "learning_rate": 4.266766466838335e-07, "loss": 0.4588, "step": 7958 }, { "epoch": 0.91, "learning_rate": 4.256075646638469e-07, "loss": 0.442, "step": 7959 }, { "epoch": 0.91, "learning_rate": 4.2453979454938563e-07, "loss": 0.4577, "step": 7960 }, { "epoch": 0.91, "learning_rate": 4.2347333648675383e-07, "loss": 0.4395, "step": 7961 }, { "epoch": 0.91, "learning_rate": 4.2240819062208337e-07, "loss": 0.4491, "step": 7962 }, { "epoch": 0.91, "learning_rate": 4.2134435710132093e-07, "loss": 0.453, "step": 7963 }, { "epoch": 0.91, "learning_rate": 4.2028183607023766e-07, "loss": 0.4556, "step": 7964 }, { "epoch": 0.91, "learning_rate": 4.192206276744204e-07, "loss": 0.4387, "step": 7965 }, { "epoch": 0.91, "learning_rate": 4.181607320592784e-07, "loss": 0.4476, "step": 7966 }, { "epoch": 0.91, "learning_rate": 4.1710214937004223e-07, "loss": 0.4507, "step": 7967 }, { "epoch": 0.91, "learning_rate": 4.1604487975176136e-07, "loss": 0.4773, "step": 7968 }, { "epoch": 0.91, "learning_rate": 4.149889233493054e-07, "loss": 0.4412, "step": 7969 }, { "epoch": 0.91, "learning_rate": 4.139342803073632e-07, "loss": 0.4464, "step": 7970 }, { "epoch": 0.91, "learning_rate": 4.128809507704445e-07, "loss": 0.4332, "step": 7971 }, { "epoch": 0.91, "learning_rate": 4.1182893488287965e-07, "loss": 0.451, "step": 7972 }, { "epoch": 0.91, "learning_rate": 4.1077823278881767e-07, "loss": 0.4384, "step": 7973 }, { "epoch": 0.91, "learning_rate": 4.097288446322278e-07, "loss": 0.4486, "step": 7974 }, { "epoch": 0.91, "learning_rate": 4.086807705569018e-07, "loss": 0.4793, "step": 7975 }, { "epoch": 0.91, "learning_rate": 4.076340107064458e-07, "loss": 0.4487, "step": 7976 }, { "epoch": 0.91, "learning_rate": 4.065885652242907e-07, "loss": 0.4378, "step": 7977 }, { "epoch": 0.91, "learning_rate": 4.055444342536885e-07, "loss": 0.4562, "step": 7978 }, { "epoch": 0.91, "learning_rate": 4.045016179377048e-07, "loss": 0.4411, "step": 7979 }, { "epoch": 0.91, "learning_rate": 4.034601164192309e-07, "loss": 0.4305, "step": 7980 }, { "epoch": 0.91, "learning_rate": 4.024199298409737e-07, "loss": 0.4558, "step": 7981 }, { "epoch": 0.91, "learning_rate": 4.013810583454647e-07, "loss": 0.4528, "step": 7982 }, { "epoch": 0.91, "learning_rate": 4.0034350207505124e-07, "loss": 0.4647, "step": 7983 }, { "epoch": 0.91, "learning_rate": 3.9930726117190064e-07, "loss": 0.4603, "step": 7984 }, { "epoch": 0.91, "learning_rate": 3.982723357780027e-07, "loss": 0.4369, "step": 7985 }, { "epoch": 0.91, "learning_rate": 3.97238726035164e-07, "loss": 0.4506, "step": 7986 }, { "epoch": 0.91, "learning_rate": 3.962064320850112e-07, "loss": 0.4454, "step": 7987 }, { "epoch": 0.91, "learning_rate": 3.951754540689956e-07, "loss": 0.4581, "step": 7988 }, { "epoch": 0.91, "learning_rate": 3.9414579212838087e-07, "loss": 0.4423, "step": 7989 }, { "epoch": 0.91, "learning_rate": 3.931174464042542e-07, "loss": 0.4595, "step": 7990 }, { "epoch": 0.91, "learning_rate": 3.920904170375239e-07, "loss": 0.4608, "step": 7991 }, { "epoch": 0.91, "learning_rate": 3.9106470416891195e-07, "loss": 0.4527, "step": 7992 }, { "epoch": 0.91, "learning_rate": 3.9004030793896807e-07, "loss": 0.4451, "step": 7993 }, { "epoch": 0.91, "learning_rate": 3.8901722848805443e-07, "loss": 0.4519, "step": 7994 }, { "epoch": 0.91, "learning_rate": 3.8799546595635784e-07, "loss": 0.4403, "step": 7995 }, { "epoch": 0.91, "learning_rate": 3.8697502048387956e-07, "loss": 0.4511, "step": 7996 }, { "epoch": 0.91, "learning_rate": 3.8595589221044674e-07, "loss": 0.4411, "step": 7997 }, { "epoch": 0.91, "learning_rate": 3.84938081275702e-07, "loss": 0.4515, "step": 7998 }, { "epoch": 0.91, "learning_rate": 3.839215878191083e-07, "loss": 0.4685, "step": 7999 }, { "epoch": 0.91, "learning_rate": 3.8290641197994526e-07, "loss": 0.4395, "step": 8000 }, { "epoch": 0.91, "learning_rate": 3.8189255389731837e-07, "loss": 0.4388, "step": 8001 }, { "epoch": 0.91, "learning_rate": 3.808800137101465e-07, "loss": 0.4422, "step": 8002 }, { "epoch": 0.91, "learning_rate": 3.7986879155717084e-07, "loss": 0.4631, "step": 8003 }, { "epoch": 0.91, "learning_rate": 3.7885888757695054e-07, "loss": 0.4384, "step": 8004 }, { "epoch": 0.91, "learning_rate": 3.778503019078672e-07, "loss": 0.4312, "step": 8005 }, { "epoch": 0.91, "learning_rate": 3.768430346881169e-07, "loss": 0.4415, "step": 8006 }, { "epoch": 0.92, "learning_rate": 3.7583708605571923e-07, "loss": 0.4421, "step": 8007 }, { "epoch": 0.92, "learning_rate": 3.748324561485128e-07, "loss": 0.4674, "step": 8008 }, { "epoch": 0.92, "learning_rate": 3.7382914510415316e-07, "loss": 0.4332, "step": 8009 }, { "epoch": 0.92, "learning_rate": 3.7282715306011465e-07, "loss": 0.4402, "step": 8010 }, { "epoch": 0.92, "learning_rate": 3.7182648015369524e-07, "loss": 0.4535, "step": 8011 }, { "epoch": 0.92, "learning_rate": 3.708271265220087e-07, "loss": 0.4524, "step": 8012 }, { "epoch": 0.92, "learning_rate": 3.698290923019865e-07, "loss": 0.4364, "step": 8013 }, { "epoch": 0.92, "learning_rate": 3.688323776303837e-07, "loss": 0.4509, "step": 8014 }, { "epoch": 0.92, "learning_rate": 3.678369826437733e-07, "loss": 0.4523, "step": 8015 }, { "epoch": 0.92, "learning_rate": 3.668429074785451e-07, "loss": 0.4636, "step": 8016 }, { "epoch": 0.92, "learning_rate": 3.6585015227091013e-07, "loss": 0.4432, "step": 8017 }, { "epoch": 0.92, "learning_rate": 3.6485871715689735e-07, "loss": 0.4289, "step": 8018 }, { "epoch": 0.92, "learning_rate": 3.63868602272357e-07, "loss": 0.4573, "step": 8019 }, { "epoch": 0.92, "learning_rate": 3.6287980775295603e-07, "loss": 0.4517, "step": 8020 }, { "epoch": 0.92, "learning_rate": 3.6189233373418064e-07, "loss": 0.4437, "step": 8021 }, { "epoch": 0.92, "learning_rate": 3.609061803513392e-07, "loss": 0.4425, "step": 8022 }, { "epoch": 0.92, "learning_rate": 3.5992134773955354e-07, "loss": 0.4543, "step": 8023 }, { "epoch": 0.92, "learning_rate": 3.589378360337692e-07, "loss": 0.4701, "step": 8024 }, { "epoch": 0.92, "learning_rate": 3.579556453687494e-07, "loss": 0.4521, "step": 8025 }, { "epoch": 0.92, "learning_rate": 3.569747758790765e-07, "loss": 0.4548, "step": 8026 }, { "epoch": 0.92, "learning_rate": 3.5599522769915074e-07, "loss": 0.4471, "step": 8027 }, { "epoch": 0.92, "learning_rate": 3.550170009631926e-07, "loss": 0.443, "step": 8028 }, { "epoch": 0.92, "learning_rate": 3.5404009580524144e-07, "loss": 0.4381, "step": 8029 }, { "epoch": 0.92, "learning_rate": 3.5306451235915475e-07, "loss": 0.4476, "step": 8030 }, { "epoch": 0.92, "learning_rate": 3.520902507586077e-07, "loss": 0.4408, "step": 8031 }, { "epoch": 0.92, "learning_rate": 3.51117311137098e-07, "loss": 0.4631, "step": 8032 }, { "epoch": 0.92, "learning_rate": 3.50145693627939e-07, "loss": 0.4327, "step": 8033 }, { "epoch": 0.92, "learning_rate": 3.4917539836426317e-07, "loss": 0.4601, "step": 8034 }, { "epoch": 0.92, "learning_rate": 3.4820642547902516e-07, "loss": 0.4565, "step": 8035 }, { "epoch": 0.92, "learning_rate": 3.472387751049944e-07, "loss": 0.4424, "step": 8036 }, { "epoch": 0.92, "learning_rate": 3.462724473747603e-07, "loss": 0.459, "step": 8037 }, { "epoch": 0.92, "learning_rate": 3.4530744242073143e-07, "loss": 0.4567, "step": 8038 }, { "epoch": 0.92, "learning_rate": 3.443437603751354e-07, "loss": 0.4382, "step": 8039 }, { "epoch": 0.92, "learning_rate": 3.433814013700187e-07, "loss": 0.4704, "step": 8040 }, { "epoch": 0.92, "learning_rate": 3.424203655372438e-07, "loss": 0.4377, "step": 8041 }, { "epoch": 0.92, "learning_rate": 3.414606530084974e-07, "loss": 0.4581, "step": 8042 }, { "epoch": 0.92, "learning_rate": 3.405022639152777e-07, "loss": 0.4452, "step": 8043 }, { "epoch": 0.92, "learning_rate": 3.3954519838890866e-07, "loss": 0.4596, "step": 8044 }, { "epoch": 0.92, "learning_rate": 3.3858945656052855e-07, "loss": 0.4302, "step": 8045 }, { "epoch": 0.92, "learning_rate": 3.376350385610938e-07, "loss": 0.4521, "step": 8046 }, { "epoch": 0.92, "learning_rate": 3.3668194452138423e-07, "loss": 0.4579, "step": 8047 }, { "epoch": 0.92, "learning_rate": 3.357301745719932e-07, "loss": 0.4506, "step": 8048 }, { "epoch": 0.92, "learning_rate": 3.34779728843333e-07, "loss": 0.4377, "step": 8049 }, { "epoch": 0.92, "learning_rate": 3.3383060746563836e-07, "loss": 0.4593, "step": 8050 }, { "epoch": 0.92, "learning_rate": 3.3288281056895746e-07, "loss": 0.4456, "step": 8051 }, { "epoch": 0.92, "learning_rate": 3.3193633828316306e-07, "loss": 0.4628, "step": 8052 }, { "epoch": 0.92, "learning_rate": 3.309911907379393e-07, "loss": 0.4529, "step": 8053 }, { "epoch": 0.92, "learning_rate": 3.300473680627947e-07, "loss": 0.4455, "step": 8054 }, { "epoch": 0.92, "learning_rate": 3.2910487038705476e-07, "loss": 0.4394, "step": 8055 }, { "epoch": 0.92, "learning_rate": 3.2816369783986166e-07, "loss": 0.463, "step": 8056 }, { "epoch": 0.92, "learning_rate": 3.2722385055017567e-07, "loss": 0.4431, "step": 8057 }, { "epoch": 0.92, "learning_rate": 3.262853286467804e-07, "loss": 0.4564, "step": 8058 }, { "epoch": 0.92, "learning_rate": 3.2534813225826965e-07, "loss": 0.4397, "step": 8059 }, { "epoch": 0.92, "learning_rate": 3.2441226151306403e-07, "loss": 0.4575, "step": 8060 }, { "epoch": 0.92, "learning_rate": 3.234777165393965e-07, "loss": 0.4362, "step": 8061 }, { "epoch": 0.92, "learning_rate": 3.2254449746532246e-07, "loss": 0.4318, "step": 8062 }, { "epoch": 0.92, "learning_rate": 3.216126044187118e-07, "loss": 0.4545, "step": 8063 }, { "epoch": 0.92, "learning_rate": 3.206820375272557e-07, "loss": 0.462, "step": 8064 }, { "epoch": 0.92, "learning_rate": 3.1975279691846437e-07, "loss": 0.4365, "step": 8065 }, { "epoch": 0.92, "learning_rate": 3.188248827196616e-07, "loss": 0.4711, "step": 8066 }, { "epoch": 0.92, "learning_rate": 3.178982950579923e-07, "loss": 0.4475, "step": 8067 }, { "epoch": 0.92, "learning_rate": 3.169730340604227e-07, "loss": 0.4419, "step": 8068 }, { "epoch": 0.92, "learning_rate": 3.160490998537313e-07, "loss": 0.4292, "step": 8069 }, { "epoch": 0.92, "learning_rate": 3.151264925645192e-07, "loss": 0.4678, "step": 8070 }, { "epoch": 0.92, "learning_rate": 3.142052123192019e-07, "loss": 0.4485, "step": 8071 }, { "epoch": 0.92, "learning_rate": 3.132852592440194e-07, "loss": 0.4481, "step": 8072 }, { "epoch": 0.92, "learning_rate": 3.1236663346502215e-07, "loss": 0.4427, "step": 8073 }, { "epoch": 0.92, "learning_rate": 3.11449335108085e-07, "loss": 0.4701, "step": 8074 }, { "epoch": 0.92, "learning_rate": 3.1053336429889616e-07, "loss": 0.4609, "step": 8075 }, { "epoch": 0.92, "learning_rate": 3.0961872116296645e-07, "loss": 0.4481, "step": 8076 }, { "epoch": 0.92, "learning_rate": 3.0870540582562003e-07, "loss": 0.4279, "step": 8077 }, { "epoch": 0.92, "learning_rate": 3.077934184120035e-07, "loss": 0.4586, "step": 8078 }, { "epoch": 0.92, "learning_rate": 3.06882759047078e-07, "loss": 0.4453, "step": 8079 }, { "epoch": 0.92, "learning_rate": 3.059734278556237e-07, "loss": 0.4442, "step": 8080 }, { "epoch": 0.92, "learning_rate": 3.050654249622398e-07, "loss": 0.4565, "step": 8081 }, { "epoch": 0.92, "learning_rate": 3.0415875049134566e-07, "loss": 0.4458, "step": 8082 }, { "epoch": 0.92, "learning_rate": 3.03253404567172e-07, "loss": 0.4353, "step": 8083 }, { "epoch": 0.92, "learning_rate": 3.0234938731377394e-07, "loss": 0.4717, "step": 8084 }, { "epoch": 0.92, "learning_rate": 3.014466988550202e-07, "loss": 0.4587, "step": 8085 }, { "epoch": 0.92, "learning_rate": 3.0054533931460186e-07, "loss": 0.4576, "step": 8086 }, { "epoch": 0.92, "learning_rate": 2.996453088160234e-07, "loss": 0.4396, "step": 8087 }, { "epoch": 0.92, "learning_rate": 2.9874660748260843e-07, "loss": 0.443, "step": 8088 }, { "epoch": 0.92, "learning_rate": 2.978492354375007e-07, "loss": 0.4552, "step": 8089 }, { "epoch": 0.92, "learning_rate": 2.969531928036595e-07, "loss": 0.4378, "step": 8090 }, { "epoch": 0.92, "learning_rate": 2.9605847970386125e-07, "loss": 0.4272, "step": 8091 }, { "epoch": 0.92, "learning_rate": 2.9516509626070553e-07, "loss": 0.4468, "step": 8092 }, { "epoch": 0.92, "learning_rate": 2.9427304259660117e-07, "loss": 0.4672, "step": 8093 }, { "epoch": 0.93, "learning_rate": 2.9338231883378365e-07, "loss": 0.4169, "step": 8094 }, { "epoch": 0.93, "learning_rate": 2.924929250942998e-07, "loss": 0.4546, "step": 8095 }, { "epoch": 0.93, "learning_rate": 2.9160486150001556e-07, "loss": 0.4413, "step": 8096 }, { "epoch": 0.93, "learning_rate": 2.907181281726179e-07, "loss": 0.4463, "step": 8097 }, { "epoch": 0.93, "learning_rate": 2.8983272523360637e-07, "loss": 0.4412, "step": 8098 }, { "epoch": 0.93, "learning_rate": 2.889486528043028e-07, "loss": 0.4416, "step": 8099 }, { "epoch": 0.93, "learning_rate": 2.880659110058448e-07, "loss": 0.4381, "step": 8100 }, { "epoch": 0.93, "learning_rate": 2.8718449995918553e-07, "loss": 0.4511, "step": 8101 }, { "epoch": 0.93, "learning_rate": 2.863044197851017e-07, "loss": 0.463, "step": 8102 }, { "epoch": 0.93, "learning_rate": 2.8542567060418135e-07, "loss": 0.4676, "step": 8103 }, { "epoch": 0.93, "learning_rate": 2.845482525368337e-07, "loss": 0.43, "step": 8104 }, { "epoch": 0.93, "learning_rate": 2.836721657032848e-07, "loss": 0.4403, "step": 8105 }, { "epoch": 0.93, "learning_rate": 2.8279741022357535e-07, "loss": 0.444, "step": 8106 }, { "epoch": 0.93, "learning_rate": 2.8192398621757156e-07, "loss": 0.4691, "step": 8107 }, { "epoch": 0.93, "learning_rate": 2.810518938049478e-07, "loss": 0.4507, "step": 8108 }, { "epoch": 0.93, "learning_rate": 2.801811331052007e-07, "loss": 0.4691, "step": 8109 }, { "epoch": 0.93, "learning_rate": 2.7931170423764363e-07, "loss": 0.4466, "step": 8110 }, { "epoch": 0.93, "learning_rate": 2.784436073214103e-07, "loss": 0.4667, "step": 8111 }, { "epoch": 0.93, "learning_rate": 2.775768424754488e-07, "loss": 0.443, "step": 8112 }, { "epoch": 0.93, "learning_rate": 2.7671140981852306e-07, "loss": 0.4504, "step": 8113 }, { "epoch": 0.93, "learning_rate": 2.7584730946921825e-07, "loss": 0.442, "step": 8114 }, { "epoch": 0.93, "learning_rate": 2.7498454154593624e-07, "loss": 0.4698, "step": 8115 }, { "epoch": 0.93, "learning_rate": 2.741231061668925e-07, "loss": 0.4184, "step": 8116 }, { "epoch": 0.93, "learning_rate": 2.73263003450126e-07, "loss": 0.4488, "step": 8117 }, { "epoch": 0.93, "learning_rate": 2.72404233513488e-07, "loss": 0.4538, "step": 8118 }, { "epoch": 0.93, "learning_rate": 2.71546796474651e-07, "loss": 0.4525, "step": 8119 }, { "epoch": 0.93, "learning_rate": 2.70690692451101e-07, "loss": 0.4407, "step": 8120 }, { "epoch": 0.93, "learning_rate": 2.698359215601443e-07, "loss": 0.4438, "step": 8121 }, { "epoch": 0.93, "learning_rate": 2.689824839189037e-07, "loss": 0.4545, "step": 8122 }, { "epoch": 0.93, "learning_rate": 2.681303796443202e-07, "loss": 0.4361, "step": 8123 }, { "epoch": 0.93, "learning_rate": 2.672796088531493e-07, "loss": 0.4593, "step": 8124 }, { "epoch": 0.93, "learning_rate": 2.664301716619666e-07, "loss": 0.4915, "step": 8125 }, { "epoch": 0.93, "learning_rate": 2.655820681871635e-07, "loss": 0.4487, "step": 8126 }, { "epoch": 0.93, "learning_rate": 2.6473529854494915e-07, "loss": 0.4443, "step": 8127 }, { "epoch": 0.93, "learning_rate": 2.638898628513498e-07, "loss": 0.443, "step": 8128 }, { "epoch": 0.93, "learning_rate": 2.6304576122221035e-07, "loss": 0.4475, "step": 8129 }, { "epoch": 0.93, "learning_rate": 2.6220299377318847e-07, "loss": 0.4359, "step": 8130 }, { "epoch": 0.93, "learning_rate": 2.613615606197661e-07, "loss": 0.444, "step": 8131 }, { "epoch": 0.93, "learning_rate": 2.605214618772356e-07, "loss": 0.4468, "step": 8132 }, { "epoch": 0.93, "learning_rate": 2.596826976607114e-07, "loss": 0.4594, "step": 8133 }, { "epoch": 0.93, "learning_rate": 2.5884526808511946e-07, "loss": 0.4441, "step": 8134 }, { "epoch": 0.93, "learning_rate": 2.5800917326521013e-07, "loss": 0.4514, "step": 8135 }, { "epoch": 0.93, "learning_rate": 2.5717441331554517e-07, "loss": 0.4474, "step": 8136 }, { "epoch": 0.93, "learning_rate": 2.5634098835050415e-07, "loss": 0.439, "step": 8137 }, { "epoch": 0.93, "learning_rate": 2.555088984842868e-07, "loss": 0.4606, "step": 8138 }, { "epoch": 0.93, "learning_rate": 2.546781438309087e-07, "loss": 0.4344, "step": 8139 }, { "epoch": 0.93, "learning_rate": 2.5384872450419985e-07, "loss": 0.4299, "step": 8140 }, { "epoch": 0.93, "learning_rate": 2.530206406178104e-07, "loss": 0.4699, "step": 8141 }, { "epoch": 0.93, "learning_rate": 2.5219389228520517e-07, "loss": 0.452, "step": 8142 }, { "epoch": 0.93, "learning_rate": 2.51368479619668e-07, "loss": 0.4446, "step": 8143 }, { "epoch": 0.93, "learning_rate": 2.505444027342996e-07, "loss": 0.4496, "step": 8144 }, { "epoch": 0.93, "learning_rate": 2.497216617420151e-07, "loss": 0.4444, "step": 8145 }, { "epoch": 0.93, "learning_rate": 2.4890025675554983e-07, "loss": 0.4439, "step": 8146 }, { "epoch": 0.93, "learning_rate": 2.480801878874528e-07, "loss": 0.4742, "step": 8147 }, { "epoch": 0.93, "learning_rate": 2.4726145525009404e-07, "loss": 0.4355, "step": 8148 }, { "epoch": 0.93, "learning_rate": 2.4644405895565717e-07, "loss": 0.4577, "step": 8149 }, { "epoch": 0.93, "learning_rate": 2.456279991161437e-07, "loss": 0.4551, "step": 8150 }, { "epoch": 0.93, "learning_rate": 2.448132758433719e-07, "loss": 0.4834, "step": 8151 }, { "epoch": 0.93, "learning_rate": 2.439998892489781e-07, "loss": 0.4243, "step": 8152 }, { "epoch": 0.93, "learning_rate": 2.4318783944441314e-07, "loss": 0.458, "step": 8153 }, { "epoch": 0.93, "learning_rate": 2.4237712654094693e-07, "loss": 0.4451, "step": 8154 }, { "epoch": 0.93, "learning_rate": 2.4156775064966273e-07, "loss": 0.4431, "step": 8155 }, { "epoch": 0.93, "learning_rate": 2.4075971188146754e-07, "loss": 0.4606, "step": 8156 }, { "epoch": 0.93, "learning_rate": 2.3995301034707597e-07, "loss": 0.451, "step": 8157 }, { "epoch": 0.93, "learning_rate": 2.3914764615702747e-07, "loss": 0.4384, "step": 8158 }, { "epoch": 0.93, "learning_rate": 2.3834361942167484e-07, "loss": 0.4686, "step": 8159 }, { "epoch": 0.93, "learning_rate": 2.375409302511855e-07, "loss": 0.4473, "step": 8160 }, { "epoch": 0.93, "learning_rate": 2.367395787555482e-07, "loss": 0.4443, "step": 8161 }, { "epoch": 0.93, "learning_rate": 2.3593956504456396e-07, "loss": 0.4512, "step": 8162 }, { "epoch": 0.93, "learning_rate": 2.3514088922785284e-07, "loss": 0.4504, "step": 8163 }, { "epoch": 0.93, "learning_rate": 2.3434355141485287e-07, "loss": 0.4591, "step": 8164 }, { "epoch": 0.93, "learning_rate": 2.335475517148167e-07, "loss": 0.4477, "step": 8165 }, { "epoch": 0.93, "learning_rate": 2.3275289023681148e-07, "loss": 0.4334, "step": 8166 }, { "epoch": 0.93, "learning_rate": 2.3195956708972566e-07, "loss": 0.462, "step": 8167 }, { "epoch": 0.93, "learning_rate": 2.3116758238226233e-07, "loss": 0.4558, "step": 8168 }, { "epoch": 0.93, "learning_rate": 2.3037693622294244e-07, "loss": 0.4568, "step": 8169 }, { "epoch": 0.93, "learning_rate": 2.2958762872009932e-07, "loss": 0.4401, "step": 8170 }, { "epoch": 0.93, "learning_rate": 2.2879965998188646e-07, "loss": 0.4245, "step": 8171 }, { "epoch": 0.93, "learning_rate": 2.280130301162742e-07, "loss": 0.4457, "step": 8172 }, { "epoch": 0.93, "learning_rate": 2.2722773923104736e-07, "loss": 0.4725, "step": 8173 }, { "epoch": 0.93, "learning_rate": 2.264437874338099e-07, "loss": 0.4427, "step": 8174 }, { "epoch": 0.93, "learning_rate": 2.2566117483197923e-07, "loss": 0.4492, "step": 8175 }, { "epoch": 0.93, "learning_rate": 2.248799015327907e-07, "loss": 0.4409, "step": 8176 }, { "epoch": 0.93, "learning_rate": 2.2409996764329644e-07, "loss": 0.431, "step": 8177 }, { "epoch": 0.93, "learning_rate": 2.233213732703665e-07, "loss": 0.4616, "step": 8178 }, { "epoch": 0.93, "learning_rate": 2.2254411852068226e-07, "loss": 0.442, "step": 8179 }, { "epoch": 0.93, "learning_rate": 2.2176820350074846e-07, "loss": 0.4572, "step": 8180 }, { "epoch": 0.93, "learning_rate": 2.2099362831688008e-07, "loss": 0.4326, "step": 8181 }, { "epoch": 0.94, "learning_rate": 2.2022039307521337e-07, "loss": 0.4631, "step": 8182 }, { "epoch": 0.94, "learning_rate": 2.1944849788169798e-07, "loss": 0.4388, "step": 8183 }, { "epoch": 0.94, "learning_rate": 2.1867794284209932e-07, "loss": 0.4536, "step": 8184 }, { "epoch": 0.94, "learning_rate": 2.179087280620018e-07, "loss": 0.4582, "step": 8185 }, { "epoch": 0.94, "learning_rate": 2.1714085364680671e-07, "loss": 0.4496, "step": 8186 }, { "epoch": 0.94, "learning_rate": 2.163743197017265e-07, "loss": 0.4677, "step": 8187 }, { "epoch": 0.94, "learning_rate": 2.156091263317972e-07, "loss": 0.4457, "step": 8188 }, { "epoch": 0.94, "learning_rate": 2.1484527364186492e-07, "loss": 0.4335, "step": 8189 }, { "epoch": 0.94, "learning_rate": 2.140827617365948e-07, "loss": 0.4598, "step": 8190 }, { "epoch": 0.94, "learning_rate": 2.1332159072046887e-07, "loss": 0.4615, "step": 8191 }, { "epoch": 0.94, "learning_rate": 2.1256176069778367e-07, "loss": 0.4394, "step": 8192 }, { "epoch": 0.94, "learning_rate": 2.118032717726537e-07, "loss": 0.4442, "step": 8193 }, { "epoch": 0.94, "learning_rate": 2.1104612404900805e-07, "loss": 0.4259, "step": 8194 }, { "epoch": 0.94, "learning_rate": 2.102903176305926e-07, "loss": 0.461, "step": 8195 }, { "epoch": 0.94, "learning_rate": 2.0953585262097232e-07, "loss": 0.451, "step": 8196 }, { "epoch": 0.94, "learning_rate": 2.0878272912352117e-07, "loss": 0.455, "step": 8197 }, { "epoch": 0.94, "learning_rate": 2.0803094724143879e-07, "loss": 0.4479, "step": 8198 }, { "epoch": 0.94, "learning_rate": 2.0728050707773285e-07, "loss": 0.4658, "step": 8199 }, { "epoch": 0.94, "learning_rate": 2.0653140873523104e-07, "loss": 0.4647, "step": 8200 }, { "epoch": 0.94, "learning_rate": 2.0578365231657792e-07, "loss": 0.4496, "step": 8201 }, { "epoch": 0.94, "learning_rate": 2.0503723792423047e-07, "loss": 0.4439, "step": 8202 }, { "epoch": 0.94, "learning_rate": 2.0429216566046682e-07, "loss": 0.4974, "step": 8203 }, { "epoch": 0.94, "learning_rate": 2.0354843562737537e-07, "loss": 0.4585, "step": 8204 }, { "epoch": 0.94, "learning_rate": 2.0280604792686676e-07, "loss": 0.4521, "step": 8205 }, { "epoch": 0.94, "learning_rate": 2.0206500266066297e-07, "loss": 0.4531, "step": 8206 }, { "epoch": 0.94, "learning_rate": 2.0132529993030392e-07, "loss": 0.4476, "step": 8207 }, { "epoch": 0.94, "learning_rate": 2.0058693983714628e-07, "loss": 0.4422, "step": 8208 }, { "epoch": 0.94, "learning_rate": 1.9984992248236135e-07, "loss": 0.4532, "step": 8209 }, { "epoch": 0.94, "learning_rate": 1.9911424796693611e-07, "loss": 0.4243, "step": 8210 }, { "epoch": 0.94, "learning_rate": 1.9837991639167552e-07, "loss": 0.4565, "step": 8211 }, { "epoch": 0.94, "learning_rate": 1.9764692785719909e-07, "loss": 0.426, "step": 8212 }, { "epoch": 0.94, "learning_rate": 1.9691528246394197e-07, "loss": 0.4706, "step": 8213 }, { "epoch": 0.94, "learning_rate": 1.9618498031215738e-07, "loss": 0.4329, "step": 8214 }, { "epoch": 0.94, "learning_rate": 1.954560215019108e-07, "loss": 0.4393, "step": 8215 }, { "epoch": 0.94, "learning_rate": 1.9472840613308787e-07, "loss": 0.4472, "step": 8216 }, { "epoch": 0.94, "learning_rate": 1.9400213430538773e-07, "loss": 0.4587, "step": 8217 }, { "epoch": 0.94, "learning_rate": 1.9327720611832523e-07, "loss": 0.4529, "step": 8218 }, { "epoch": 0.94, "learning_rate": 1.9255362167123316e-07, "loss": 0.4603, "step": 8219 }, { "epoch": 0.94, "learning_rate": 1.918313810632566e-07, "loss": 0.4376, "step": 8220 }, { "epoch": 0.94, "learning_rate": 1.9111048439335978e-07, "loss": 0.4576, "step": 8221 }, { "epoch": 0.94, "learning_rate": 1.903909317603214e-07, "loss": 0.4322, "step": 8222 }, { "epoch": 0.94, "learning_rate": 1.89672723262736e-07, "loss": 0.4532, "step": 8223 }, { "epoch": 0.94, "learning_rate": 1.889558589990148e-07, "loss": 0.459, "step": 8224 }, { "epoch": 0.94, "learning_rate": 1.882403390673837e-07, "loss": 0.4548, "step": 8225 }, { "epoch": 0.94, "learning_rate": 1.8752616356588648e-07, "loss": 0.4389, "step": 8226 }, { "epoch": 0.94, "learning_rate": 1.8681333259237933e-07, "loss": 0.4535, "step": 8227 }, { "epoch": 0.94, "learning_rate": 1.861018462445352e-07, "loss": 0.4543, "step": 8228 }, { "epoch": 0.94, "learning_rate": 1.8539170461984612e-07, "loss": 0.4711, "step": 8229 }, { "epoch": 0.94, "learning_rate": 1.8468290781561538e-07, "loss": 0.4632, "step": 8230 }, { "epoch": 0.94, "learning_rate": 1.8397545592896527e-07, "loss": 0.4474, "step": 8231 }, { "epoch": 0.94, "learning_rate": 1.832693490568327e-07, "loss": 0.4422, "step": 8232 }, { "epoch": 0.94, "learning_rate": 1.8256458729596692e-07, "loss": 0.4676, "step": 8233 }, { "epoch": 0.94, "learning_rate": 1.8186117074293964e-07, "loss": 0.4515, "step": 8234 }, { "epoch": 0.94, "learning_rate": 1.811590994941337e-07, "loss": 0.4537, "step": 8235 }, { "epoch": 0.94, "learning_rate": 1.804583736457477e-07, "loss": 0.437, "step": 8236 }, { "epoch": 0.94, "learning_rate": 1.797589932937982e-07, "loss": 0.4531, "step": 8237 }, { "epoch": 0.94, "learning_rate": 1.790609585341141e-07, "loss": 0.4455, "step": 8238 }, { "epoch": 0.94, "learning_rate": 1.7836426946234332e-07, "loss": 0.4547, "step": 8239 }, { "epoch": 0.94, "learning_rate": 1.7766892617394727e-07, "loss": 0.4408, "step": 8240 }, { "epoch": 0.94, "learning_rate": 1.7697492876420198e-07, "loss": 0.4442, "step": 8241 }, { "epoch": 0.94, "learning_rate": 1.7628227732820247e-07, "loss": 0.4326, "step": 8242 }, { "epoch": 0.94, "learning_rate": 1.755909719608573e-07, "loss": 0.4699, "step": 8243 }, { "epoch": 0.94, "learning_rate": 1.7490101275689064e-07, "loss": 0.459, "step": 8244 }, { "epoch": 0.94, "learning_rate": 1.7421239981084136e-07, "loss": 0.4532, "step": 8245 }, { "epoch": 0.94, "learning_rate": 1.7352513321706621e-07, "loss": 0.4455, "step": 8246 }, { "epoch": 0.94, "learning_rate": 1.7283921306973538e-07, "loss": 0.4646, "step": 8247 }, { "epoch": 0.94, "learning_rate": 1.7215463946283483e-07, "loss": 0.4467, "step": 8248 }, { "epoch": 0.94, "learning_rate": 1.714714124901662e-07, "loss": 0.4495, "step": 8249 }, { "epoch": 0.94, "learning_rate": 1.70789532245349e-07, "loss": 0.4299, "step": 8250 }, { "epoch": 0.94, "learning_rate": 1.70108998821813e-07, "loss": 0.456, "step": 8251 }, { "epoch": 0.94, "learning_rate": 1.6942981231280798e-07, "loss": 0.4508, "step": 8252 }, { "epoch": 0.94, "learning_rate": 1.6875197281139844e-07, "loss": 0.4679, "step": 8253 }, { "epoch": 0.94, "learning_rate": 1.680754804104623e-07, "loss": 0.4539, "step": 8254 }, { "epoch": 0.94, "learning_rate": 1.6740033520269538e-07, "loss": 0.458, "step": 8255 }, { "epoch": 0.94, "learning_rate": 1.6672653728060594e-07, "loss": 0.4426, "step": 8256 }, { "epoch": 0.94, "learning_rate": 1.6605408673652012e-07, "loss": 0.4507, "step": 8257 }, { "epoch": 0.94, "learning_rate": 1.6538298366257975e-07, "loss": 0.4408, "step": 8258 }, { "epoch": 0.94, "learning_rate": 1.647132281507391e-07, "loss": 0.4554, "step": 8259 }, { "epoch": 0.94, "learning_rate": 1.6404482029277023e-07, "loss": 0.4514, "step": 8260 }, { "epoch": 0.94, "learning_rate": 1.6337776018026108e-07, "loss": 0.449, "step": 8261 }, { "epoch": 0.94, "learning_rate": 1.627120479046118e-07, "loss": 0.4437, "step": 8262 }, { "epoch": 0.94, "learning_rate": 1.620476835570417e-07, "loss": 0.4701, "step": 8263 }, { "epoch": 0.94, "learning_rate": 1.6138466722858237e-07, "loss": 0.4428, "step": 8264 }, { "epoch": 0.94, "learning_rate": 1.6072299901008226e-07, "loss": 0.4623, "step": 8265 }, { "epoch": 0.94, "learning_rate": 1.6006267899220552e-07, "loss": 0.4378, "step": 8266 }, { "epoch": 0.94, "learning_rate": 1.5940370726542864e-07, "loss": 0.4599, "step": 8267 }, { "epoch": 0.94, "learning_rate": 1.587460839200472e-07, "loss": 0.4498, "step": 8268 }, { "epoch": 0.95, "learning_rate": 1.580898090461691e-07, "loss": 0.4708, "step": 8269 }, { "epoch": 0.95, "learning_rate": 1.5743488273372133e-07, "loss": 0.4397, "step": 8270 }, { "epoch": 0.95, "learning_rate": 1.567813050724387e-07, "loss": 0.4513, "step": 8271 }, { "epoch": 0.95, "learning_rate": 1.5612907615187967e-07, "loss": 0.4539, "step": 8272 }, { "epoch": 0.95, "learning_rate": 1.554781960614138e-07, "loss": 0.467, "step": 8273 }, { "epoch": 0.95, "learning_rate": 1.548286648902253e-07, "loss": 0.4331, "step": 8274 }, { "epoch": 0.95, "learning_rate": 1.5418048272731413e-07, "loss": 0.438, "step": 8275 }, { "epoch": 0.95, "learning_rate": 1.5353364966149697e-07, "loss": 0.4538, "step": 8276 }, { "epoch": 0.95, "learning_rate": 1.5288816578140298e-07, "loss": 0.4652, "step": 8277 }, { "epoch": 0.95, "learning_rate": 1.5224403117547916e-07, "loss": 0.4538, "step": 8278 }, { "epoch": 0.95, "learning_rate": 1.51601245931986e-07, "loss": 0.4449, "step": 8279 }, { "epoch": 0.95, "learning_rate": 1.5095981013899863e-07, "loss": 0.435, "step": 8280 }, { "epoch": 0.95, "learning_rate": 1.5031972388440787e-07, "loss": 0.4511, "step": 8281 }, { "epoch": 0.95, "learning_rate": 1.4968098725592127e-07, "loss": 0.445, "step": 8282 }, { "epoch": 0.95, "learning_rate": 1.4904360034106e-07, "loss": 0.4407, "step": 8283 }, { "epoch": 0.95, "learning_rate": 1.4840756322715866e-07, "loss": 0.4414, "step": 8284 }, { "epoch": 0.95, "learning_rate": 1.477728760013697e-07, "loss": 0.4752, "step": 8285 }, { "epoch": 0.95, "learning_rate": 1.4713953875065912e-07, "loss": 0.4692, "step": 8286 }, { "epoch": 0.95, "learning_rate": 1.4650755156180973e-07, "loss": 0.4513, "step": 8287 }, { "epoch": 0.95, "learning_rate": 1.458769145214145e-07, "loss": 0.4425, "step": 8288 }, { "epoch": 0.95, "learning_rate": 1.4524762771588763e-07, "loss": 0.4558, "step": 8289 }, { "epoch": 0.95, "learning_rate": 1.4461969123145458e-07, "loss": 0.4535, "step": 8290 }, { "epoch": 0.95, "learning_rate": 1.4399310515415655e-07, "loss": 0.4321, "step": 8291 }, { "epoch": 0.95, "learning_rate": 1.4336786956985038e-07, "loss": 0.4441, "step": 8292 }, { "epoch": 0.95, "learning_rate": 1.4274398456420647e-07, "loss": 0.4445, "step": 8293 }, { "epoch": 0.95, "learning_rate": 1.4212145022271196e-07, "loss": 0.4637, "step": 8294 }, { "epoch": 0.95, "learning_rate": 1.415002666306664e-07, "loss": 0.4635, "step": 8295 }, { "epoch": 0.95, "learning_rate": 1.4088043387318838e-07, "loss": 0.4472, "step": 8296 }, { "epoch": 0.95, "learning_rate": 1.4026195203520666e-07, "loss": 0.4377, "step": 8297 }, { "epoch": 0.95, "learning_rate": 1.3964482120146672e-07, "loss": 0.4463, "step": 8298 }, { "epoch": 0.95, "learning_rate": 1.3902904145653094e-07, "loss": 0.4532, "step": 8299 }, { "epoch": 0.95, "learning_rate": 1.384146128847741e-07, "loss": 0.4427, "step": 8300 }, { "epoch": 0.95, "learning_rate": 1.3780153557038655e-07, "loss": 0.4533, "step": 8301 }, { "epoch": 0.95, "learning_rate": 1.3718980959737448e-07, "loss": 0.4675, "step": 8302 }, { "epoch": 0.95, "learning_rate": 1.365794350495564e-07, "loss": 0.4572, "step": 8303 }, { "epoch": 0.95, "learning_rate": 1.359704120105687e-07, "loss": 0.4524, "step": 8304 }, { "epoch": 0.95, "learning_rate": 1.3536274056386134e-07, "loss": 0.4236, "step": 8305 }, { "epoch": 0.95, "learning_rate": 1.3475642079269659e-07, "loss": 0.4386, "step": 8306 }, { "epoch": 0.95, "learning_rate": 1.3415145278015575e-07, "loss": 0.4413, "step": 8307 }, { "epoch": 0.95, "learning_rate": 1.335478366091325e-07, "loss": 0.4468, "step": 8308 }, { "epoch": 0.95, "learning_rate": 1.329455723623352e-07, "loss": 0.4596, "step": 8309 }, { "epoch": 0.95, "learning_rate": 1.3234466012228887e-07, "loss": 0.467, "step": 8310 }, { "epoch": 0.95, "learning_rate": 1.31745099971331e-07, "loss": 0.4309, "step": 8311 }, { "epoch": 0.95, "learning_rate": 1.3114689199161478e-07, "loss": 0.4875, "step": 8312 }, { "epoch": 0.95, "learning_rate": 1.3055003626510687e-07, "loss": 0.4334, "step": 8313 }, { "epoch": 0.95, "learning_rate": 1.2995453287359293e-07, "loss": 0.4388, "step": 8314 }, { "epoch": 0.95, "learning_rate": 1.2936038189866773e-07, "loss": 0.4582, "step": 8315 }, { "epoch": 0.95, "learning_rate": 1.287675834217428e-07, "loss": 0.4398, "step": 8316 }, { "epoch": 0.95, "learning_rate": 1.2817613752404646e-07, "loss": 0.4413, "step": 8317 }, { "epoch": 0.95, "learning_rate": 1.2758604428661836e-07, "loss": 0.469, "step": 8318 }, { "epoch": 0.95, "learning_rate": 1.2699730379031604e-07, "loss": 0.4525, "step": 8319 }, { "epoch": 0.95, "learning_rate": 1.2640991611580943e-07, "loss": 0.4553, "step": 8320 }, { "epoch": 0.95, "learning_rate": 1.2582388134358414e-07, "loss": 0.469, "step": 8321 }, { "epoch": 0.95, "learning_rate": 1.2523919955393925e-07, "loss": 0.4566, "step": 8322 }, { "epoch": 0.95, "learning_rate": 1.246558708269896e-07, "loss": 0.4418, "step": 8323 }, { "epoch": 0.95, "learning_rate": 1.2407389524266456e-07, "loss": 0.4348, "step": 8324 }, { "epoch": 0.95, "learning_rate": 1.23493272880707e-07, "loss": 0.4491, "step": 8325 }, { "epoch": 0.95, "learning_rate": 1.2291400382067553e-07, "loss": 0.4521, "step": 8326 }, { "epoch": 0.95, "learning_rate": 1.223360881419433e-07, "loss": 0.4571, "step": 8327 }, { "epoch": 0.95, "learning_rate": 1.21759525923697e-07, "loss": 0.4485, "step": 8328 }, { "epoch": 0.95, "learning_rate": 1.2118431724493895e-07, "loss": 0.4499, "step": 8329 }, { "epoch": 0.95, "learning_rate": 1.2061046218448724e-07, "loss": 0.4544, "step": 8330 }, { "epoch": 0.95, "learning_rate": 1.2003796082097008e-07, "loss": 0.4409, "step": 8331 }, { "epoch": 0.95, "learning_rate": 1.194668132328325e-07, "loss": 0.4329, "step": 8332 }, { "epoch": 0.95, "learning_rate": 1.1889701949833743e-07, "loss": 0.4414, "step": 8333 }, { "epoch": 0.95, "learning_rate": 1.18328579695558e-07, "loss": 0.448, "step": 8334 }, { "epoch": 0.95, "learning_rate": 1.1776149390238301e-07, "loss": 0.4538, "step": 8335 }, { "epoch": 0.95, "learning_rate": 1.1719576219651585e-07, "loss": 0.4408, "step": 8336 }, { "epoch": 0.95, "learning_rate": 1.1663138465547341e-07, "loss": 0.4368, "step": 8337 }, { "epoch": 0.95, "learning_rate": 1.1606836135658939e-07, "loss": 0.453, "step": 8338 }, { "epoch": 0.95, "learning_rate": 1.1550669237700985e-07, "loss": 0.4487, "step": 8339 }, { "epoch": 0.95, "learning_rate": 1.1494637779369766e-07, "loss": 0.429, "step": 8340 }, { "epoch": 0.95, "learning_rate": 1.1438741768342587e-07, "loss": 0.4466, "step": 8341 }, { "epoch": 0.95, "learning_rate": 1.1382981212278655e-07, "loss": 0.4571, "step": 8342 }, { "epoch": 0.95, "learning_rate": 1.13273561188183e-07, "loss": 0.4546, "step": 8343 }, { "epoch": 0.95, "learning_rate": 1.1271866495583428e-07, "loss": 0.4403, "step": 8344 }, { "epoch": 0.95, "learning_rate": 1.12165123501774e-07, "loss": 0.4579, "step": 8345 }, { "epoch": 0.95, "learning_rate": 1.1161293690184927e-07, "loss": 0.4458, "step": 8346 }, { "epoch": 0.95, "learning_rate": 1.1106210523172068e-07, "loss": 0.4447, "step": 8347 }, { "epoch": 0.95, "learning_rate": 1.1051262856686673e-07, "loss": 0.4585, "step": 8348 }, { "epoch": 0.95, "learning_rate": 1.0996450698257721e-07, "loss": 0.4428, "step": 8349 }, { "epoch": 0.95, "learning_rate": 1.0941774055395538e-07, "loss": 0.4559, "step": 8350 }, { "epoch": 0.95, "learning_rate": 1.0887232935592351e-07, "loss": 0.4442, "step": 8351 }, { "epoch": 0.95, "learning_rate": 1.0832827346321295e-07, "loss": 0.4561, "step": 8352 }, { "epoch": 0.95, "learning_rate": 1.0778557295037296e-07, "loss": 0.4558, "step": 8353 }, { "epoch": 0.95, "learning_rate": 1.0724422789176404e-07, "loss": 0.4638, "step": 8354 }, { "epoch": 0.95, "learning_rate": 1.0670423836156241e-07, "loss": 0.439, "step": 8355 }, { "epoch": 0.95, "learning_rate": 1.0616560443376e-07, "loss": 0.4519, "step": 8356 }, { "epoch": 0.96, "learning_rate": 1.0562832618216223e-07, "loss": 0.4447, "step": 8357 }, { "epoch": 0.96, "learning_rate": 1.0509240368038576e-07, "loss": 0.4416, "step": 8358 }, { "epoch": 0.96, "learning_rate": 1.0455783700186628e-07, "loss": 0.4505, "step": 8359 }, { "epoch": 0.96, "learning_rate": 1.0402462621984965e-07, "loss": 0.4415, "step": 8360 }, { "epoch": 0.96, "learning_rate": 1.0349277140739966e-07, "loss": 0.4615, "step": 8361 }, { "epoch": 0.96, "learning_rate": 1.0296227263739023e-07, "loss": 0.4467, "step": 8362 }, { "epoch": 0.96, "learning_rate": 1.0243312998251209e-07, "loss": 0.4314, "step": 8363 }, { "epoch": 0.96, "learning_rate": 1.0190534351527059e-07, "loss": 0.4581, "step": 8364 }, { "epoch": 0.96, "learning_rate": 1.0137891330798344e-07, "loss": 0.4285, "step": 8365 }, { "epoch": 0.96, "learning_rate": 1.0085383943278293e-07, "loss": 0.4495, "step": 8366 }, { "epoch": 0.96, "learning_rate": 1.0033012196161706e-07, "loss": 0.4665, "step": 8367 }, { "epoch": 0.96, "learning_rate": 9.980776096624511e-08, "loss": 0.4569, "step": 8368 }, { "epoch": 0.96, "learning_rate": 9.928675651824427e-08, "loss": 0.4427, "step": 8369 }, { "epoch": 0.96, "learning_rate": 9.876710868900297e-08, "loss": 0.4595, "step": 8370 }, { "epoch": 0.96, "learning_rate": 9.824881754972426e-08, "loss": 0.4592, "step": 8371 }, { "epoch": 0.96, "learning_rate": 9.773188317142579e-08, "loss": 0.4459, "step": 8372 }, { "epoch": 0.96, "learning_rate": 9.721630562493867e-08, "loss": 0.4578, "step": 8373 }, { "epoch": 0.96, "learning_rate": 9.670208498090861e-08, "loss": 0.4662, "step": 8374 }, { "epoch": 0.96, "learning_rate": 9.61892213097959e-08, "loss": 0.4425, "step": 8375 }, { "epoch": 0.96, "learning_rate": 9.567771468187326e-08, "loss": 0.4341, "step": 8376 }, { "epoch": 0.96, "learning_rate": 9.516756516723124e-08, "loss": 0.4402, "step": 8377 }, { "epoch": 0.96, "learning_rate": 9.46587728357673e-08, "loss": 0.4484, "step": 8378 }, { "epoch": 0.96, "learning_rate": 9.415133775720231e-08, "loss": 0.477, "step": 8379 }, { "epoch": 0.96, "learning_rate": 9.364526000106289e-08, "loss": 0.4292, "step": 8380 }, { "epoch": 0.96, "learning_rate": 9.314053963669245e-08, "loss": 0.4351, "step": 8381 }, { "epoch": 0.96, "learning_rate": 9.263717673325124e-08, "loss": 0.4642, "step": 8382 }, { "epoch": 0.96, "learning_rate": 9.213517135971073e-08, "loss": 0.4251, "step": 8383 }, { "epoch": 0.96, "learning_rate": 9.163452358485591e-08, "loss": 0.4471, "step": 8384 }, { "epoch": 0.96, "learning_rate": 9.113523347728748e-08, "loss": 0.4405, "step": 8385 }, { "epoch": 0.96, "learning_rate": 9.063730110541846e-08, "loss": 0.4519, "step": 8386 }, { "epoch": 0.96, "learning_rate": 9.014072653747763e-08, "loss": 0.4561, "step": 8387 }, { "epoch": 0.96, "learning_rate": 8.964550984150611e-08, "loss": 0.4654, "step": 8388 }, { "epoch": 0.96, "learning_rate": 8.915165108536072e-08, "loss": 0.4423, "step": 8389 }, { "epoch": 0.96, "learning_rate": 8.865915033671069e-08, "loss": 0.4749, "step": 8390 }, { "epoch": 0.96, "learning_rate": 8.816800766303756e-08, "loss": 0.4455, "step": 8391 }, { "epoch": 0.96, "learning_rate": 8.767822313164198e-08, "loss": 0.4368, "step": 8392 }, { "epoch": 0.96, "learning_rate": 8.718979680963469e-08, "loss": 0.4495, "step": 8393 }, { "epoch": 0.96, "learning_rate": 8.670272876393881e-08, "loss": 0.4468, "step": 8394 }, { "epoch": 0.96, "learning_rate": 8.621701906129542e-08, "loss": 0.4538, "step": 8395 }, { "epoch": 0.96, "learning_rate": 8.573266776825683e-08, "loss": 0.4725, "step": 8396 }, { "epoch": 0.96, "learning_rate": 8.524967495119107e-08, "loss": 0.4482, "step": 8397 }, { "epoch": 0.96, "learning_rate": 8.476804067627852e-08, "loss": 0.4601, "step": 8398 }, { "epoch": 0.96, "learning_rate": 8.428776500951308e-08, "loss": 0.4497, "step": 8399 }, { "epoch": 0.96, "learning_rate": 8.380884801670431e-08, "loss": 0.4364, "step": 8400 }, { "epoch": 0.96, "learning_rate": 8.333128976347305e-08, "loss": 0.4429, "step": 8401 }, { "epoch": 0.96, "learning_rate": 8.285509031525696e-08, "loss": 0.461, "step": 8402 }, { "epoch": 0.96, "learning_rate": 8.238024973730497e-08, "loss": 0.4412, "step": 8403 }, { "epoch": 0.96, "learning_rate": 8.190676809468056e-08, "loss": 0.4573, "step": 8404 }, { "epoch": 0.96, "learning_rate": 8.143464545226298e-08, "loss": 0.4421, "step": 8405 }, { "epoch": 0.96, "learning_rate": 8.096388187474269e-08, "loss": 0.4717, "step": 8406 }, { "epoch": 0.96, "learning_rate": 8.049447742662364e-08, "loss": 0.4514, "step": 8407 }, { "epoch": 0.96, "learning_rate": 8.002643217222661e-08, "loss": 0.4507, "step": 8408 }, { "epoch": 0.96, "learning_rate": 7.955974617568252e-08, "loss": 0.4262, "step": 8409 }, { "epoch": 0.96, "learning_rate": 7.90944195009391e-08, "loss": 0.4479, "step": 8410 }, { "epoch": 0.96, "learning_rate": 7.863045221175647e-08, "loss": 0.4506, "step": 8411 }, { "epoch": 0.96, "learning_rate": 7.81678443717071e-08, "loss": 0.4619, "step": 8412 }, { "epoch": 0.96, "learning_rate": 7.77065960441803e-08, "loss": 0.4708, "step": 8413 }, { "epoch": 0.96, "learning_rate": 7.72467072923766e-08, "loss": 0.4405, "step": 8414 }, { "epoch": 0.96, "learning_rate": 7.678817817931006e-08, "loss": 0.4463, "step": 8415 }, { "epoch": 0.96, "learning_rate": 7.633100876781152e-08, "loss": 0.48, "step": 8416 }, { "epoch": 0.96, "learning_rate": 7.587519912052199e-08, "loss": 0.4355, "step": 8417 }, { "epoch": 0.96, "learning_rate": 7.542074929989818e-08, "loss": 0.4531, "step": 8418 }, { "epoch": 0.96, "learning_rate": 7.496765936821027e-08, "loss": 0.4639, "step": 8419 }, { "epoch": 0.96, "learning_rate": 7.451592938753971e-08, "loss": 0.4652, "step": 8420 }, { "epoch": 0.96, "learning_rate": 7.406555941978478e-08, "loss": 0.4412, "step": 8421 }, { "epoch": 0.96, "learning_rate": 7.361654952665608e-08, "loss": 0.4694, "step": 8422 }, { "epoch": 0.96, "learning_rate": 7.31688997696789e-08, "loss": 0.4387, "step": 8423 }, { "epoch": 0.96, "learning_rate": 7.272261021019079e-08, "loss": 0.4594, "step": 8424 }, { "epoch": 0.96, "learning_rate": 7.227768090934285e-08, "loss": 0.4461, "step": 8425 }, { "epoch": 0.96, "learning_rate": 7.183411192810075e-08, "loss": 0.4421, "step": 8426 }, { "epoch": 0.96, "learning_rate": 7.139190332724255e-08, "loss": 0.4374, "step": 8427 }, { "epoch": 0.96, "learning_rate": 7.095105516736201e-08, "loss": 0.4646, "step": 8428 }, { "epoch": 0.96, "learning_rate": 7.051156750886523e-08, "loss": 0.451, "step": 8429 }, { "epoch": 0.96, "learning_rate": 7.007344041196962e-08, "loss": 0.4344, "step": 8430 }, { "epoch": 0.96, "learning_rate": 6.963667393671048e-08, "loss": 0.4456, "step": 8431 }, { "epoch": 0.96, "learning_rate": 6.920126814293438e-08, "loss": 0.4396, "step": 8432 }, { "epoch": 0.96, "learning_rate": 6.876722309030026e-08, "loss": 0.4522, "step": 8433 }, { "epoch": 0.96, "learning_rate": 6.833453883828389e-08, "loss": 0.449, "step": 8434 }, { "epoch": 0.96, "learning_rate": 6.790321544617117e-08, "loss": 0.4438, "step": 8435 }, { "epoch": 0.96, "learning_rate": 6.747325297306484e-08, "loss": 0.4538, "step": 8436 }, { "epoch": 0.96, "learning_rate": 6.704465147787665e-08, "loss": 0.4676, "step": 8437 }, { "epoch": 0.96, "learning_rate": 6.661741101933628e-08, "loss": 0.4309, "step": 8438 }, { "epoch": 0.96, "learning_rate": 6.61915316559858e-08, "loss": 0.4555, "step": 8439 }, { "epoch": 0.96, "learning_rate": 6.576701344617964e-08, "loss": 0.4451, "step": 8440 }, { "epoch": 0.96, "learning_rate": 6.534385644808461e-08, "loss": 0.4492, "step": 8441 }, { "epoch": 0.96, "learning_rate": 6.492206071968432e-08, "loss": 0.4569, "step": 8442 }, { "epoch": 0.96, "learning_rate": 6.450162631877366e-08, "loss": 0.4277, "step": 8443 }, { "epoch": 0.97, "learning_rate": 6.40825533029632e-08, "loss": 0.4393, "step": 8444 }, { "epoch": 0.97, "learning_rate": 6.366484172967369e-08, "loss": 0.4463, "step": 8445 }, { "epoch": 0.97, "learning_rate": 6.324849165614045e-08, "loss": 0.4572, "step": 8446 }, { "epoch": 0.97, "learning_rate": 6.28335031394134e-08, "loss": 0.4336, "step": 8447 }, { "epoch": 0.97, "learning_rate": 6.241987623635482e-08, "loss": 0.4617, "step": 8448 }, { "epoch": 0.97, "learning_rate": 6.200761100364272e-08, "loss": 0.4252, "step": 8449 }, { "epoch": 0.97, "learning_rate": 6.159670749776414e-08, "loss": 0.4396, "step": 8450 }, { "epoch": 0.97, "learning_rate": 6.118716577502404e-08, "loss": 0.4562, "step": 8451 }, { "epoch": 0.97, "learning_rate": 6.077898589153642e-08, "loss": 0.4598, "step": 8452 }, { "epoch": 0.97, "learning_rate": 6.037216790323319e-08, "loss": 0.4458, "step": 8453 }, { "epoch": 0.97, "learning_rate": 5.996671186585756e-08, "loss": 0.4534, "step": 8454 }, { "epoch": 0.97, "learning_rate": 5.9562617834963974e-08, "loss": 0.4514, "step": 8455 }, { "epoch": 0.97, "learning_rate": 5.915988586592481e-08, "loss": 0.4507, "step": 8456 }, { "epoch": 0.97, "learning_rate": 5.8758516013921464e-08, "loss": 0.4562, "step": 8457 }, { "epoch": 0.97, "learning_rate": 5.8358508333951066e-08, "loss": 0.4379, "step": 8458 }, { "epoch": 0.97, "learning_rate": 5.795986288082422e-08, "loss": 0.438, "step": 8459 }, { "epoch": 0.97, "learning_rate": 5.75625797091639e-08, "loss": 0.4665, "step": 8460 }, { "epoch": 0.97, "learning_rate": 5.716665887340656e-08, "loss": 0.4447, "step": 8461 }, { "epoch": 0.97, "learning_rate": 5.677210042780212e-08, "loss": 0.4512, "step": 8462 }, { "epoch": 0.97, "learning_rate": 5.637890442641403e-08, "loss": 0.4368, "step": 8463 }, { "epoch": 0.97, "learning_rate": 5.598707092311917e-08, "loss": 0.4483, "step": 8464 }, { "epoch": 0.97, "learning_rate": 5.5596599971606823e-08, "loss": 0.4491, "step": 8465 }, { "epoch": 0.97, "learning_rate": 5.520749162538197e-08, "loss": 0.4589, "step": 8466 }, { "epoch": 0.97, "learning_rate": 5.4819745937758625e-08, "loss": 0.4372, "step": 8467 }, { "epoch": 0.97, "learning_rate": 5.443336296186874e-08, "loss": 0.4507, "step": 8468 }, { "epoch": 0.97, "learning_rate": 5.40483427506544e-08, "loss": 0.4463, "step": 8469 }, { "epoch": 0.97, "learning_rate": 5.3664685356871193e-08, "loss": 0.4787, "step": 8470 }, { "epoch": 0.97, "learning_rate": 5.3282390833090393e-08, "loss": 0.4549, "step": 8471 }, { "epoch": 0.97, "learning_rate": 5.290145923169343e-08, "loss": 0.4251, "step": 8472 }, { "epoch": 0.97, "learning_rate": 5.252189060487855e-08, "loss": 0.4497, "step": 8473 }, { "epoch": 0.97, "learning_rate": 5.214368500465305e-08, "loss": 0.4614, "step": 8474 }, { "epoch": 0.97, "learning_rate": 5.176684248283992e-08, "loss": 0.4422, "step": 8475 }, { "epoch": 0.97, "learning_rate": 5.1391363091075616e-08, "loss": 0.4454, "step": 8476 }, { "epoch": 0.97, "learning_rate": 5.1017246880809e-08, "loss": 0.4402, "step": 8477 }, { "epoch": 0.97, "learning_rate": 5.064449390330239e-08, "loss": 0.4599, "step": 8478 }, { "epoch": 0.97, "learning_rate": 5.02731042096305e-08, "loss": 0.4456, "step": 8479 }, { "epoch": 0.97, "learning_rate": 4.99030778506826e-08, "loss": 0.4534, "step": 8480 }, { "epoch": 0.97, "learning_rate": 4.953441487716037e-08, "loss": 0.4505, "step": 8481 }, { "epoch": 0.97, "learning_rate": 4.9167115339580074e-08, "loss": 0.461, "step": 8482 }, { "epoch": 0.97, "learning_rate": 4.8801179288268105e-08, "loss": 0.4449, "step": 8483 }, { "epoch": 0.97, "learning_rate": 4.84366067733677e-08, "loss": 0.451, "step": 8484 }, { "epoch": 0.97, "learning_rate": 4.807339784483112e-08, "loss": 0.4375, "step": 8485 }, { "epoch": 0.97, "learning_rate": 4.771155255242854e-08, "loss": 0.4622, "step": 8486 }, { "epoch": 0.97, "learning_rate": 4.7351070945739206e-08, "loss": 0.4462, "step": 8487 }, { "epoch": 0.97, "learning_rate": 4.699195307415805e-08, "loss": 0.4648, "step": 8488 }, { "epoch": 0.97, "learning_rate": 4.663419898689125e-08, "loss": 0.4283, "step": 8489 }, { "epoch": 0.97, "learning_rate": 4.6277808732959616e-08, "loss": 0.4329, "step": 8490 }, { "epoch": 0.97, "learning_rate": 4.5922782361197405e-08, "loss": 0.4742, "step": 8491 }, { "epoch": 0.97, "learning_rate": 4.556911992025015e-08, "loss": 0.4469, "step": 8492 }, { "epoch": 0.97, "learning_rate": 4.521682145857797e-08, "loss": 0.4465, "step": 8493 }, { "epoch": 0.97, "learning_rate": 4.486588702445338e-08, "loss": 0.4458, "step": 8494 }, { "epoch": 0.97, "learning_rate": 4.451631666596123e-08, "loss": 0.4394, "step": 8495 }, { "epoch": 0.97, "learning_rate": 4.416811043100322e-08, "loss": 0.4785, "step": 8496 }, { "epoch": 0.97, "learning_rate": 4.382126836728895e-08, "loss": 0.4551, "step": 8497 }, { "epoch": 0.97, "learning_rate": 4.347579052234374e-08, "loss": 0.4671, "step": 8498 }, { "epoch": 0.97, "learning_rate": 4.3131676943506395e-08, "loss": 0.4613, "step": 8499 }, { "epoch": 0.97, "learning_rate": 4.278892767792808e-08, "loss": 0.463, "step": 8500 }, { "epoch": 0.97, "learning_rate": 4.244754277257346e-08, "loss": 0.4322, "step": 8501 }, { "epoch": 0.97, "learning_rate": 4.210752227421955e-08, "loss": 0.4353, "step": 8502 }, { "epoch": 0.97, "learning_rate": 4.176886622945575e-08, "loss": 0.4607, "step": 8503 }, { "epoch": 0.97, "learning_rate": 4.143157468468717e-08, "loss": 0.4652, "step": 8504 }, { "epoch": 0.97, "learning_rate": 4.109564768613017e-08, "loss": 0.4465, "step": 8505 }, { "epoch": 0.97, "learning_rate": 4.076108527981237e-08, "loss": 0.4399, "step": 8506 }, { "epoch": 0.97, "learning_rate": 4.0427887511578224e-08, "loss": 0.4457, "step": 8507 }, { "epoch": 0.97, "learning_rate": 4.009605442708231e-08, "loss": 0.4501, "step": 8508 }, { "epoch": 0.97, "learning_rate": 3.976558607179382e-08, "loss": 0.4637, "step": 8509 }, { "epoch": 0.97, "learning_rate": 3.943648249099319e-08, "loss": 0.4323, "step": 8510 }, { "epoch": 0.97, "learning_rate": 3.910874372977658e-08, "loss": 0.4528, "step": 8511 }, { "epoch": 0.97, "learning_rate": 3.8782369833050284e-08, "loss": 0.4539, "step": 8512 }, { "epoch": 0.97, "learning_rate": 3.845736084553408e-08, "loss": 0.4405, "step": 8513 }, { "epoch": 0.97, "learning_rate": 3.813371681176348e-08, "loss": 0.4558, "step": 8514 }, { "epoch": 0.97, "learning_rate": 3.7811437776084095e-08, "loss": 0.4546, "step": 8515 }, { "epoch": 0.97, "learning_rate": 3.749052378265505e-08, "loss": 0.4363, "step": 8516 }, { "epoch": 0.97, "learning_rate": 3.717097487545007e-08, "loss": 0.4546, "step": 8517 }, { "epoch": 0.97, "learning_rate": 3.6852791098251906e-08, "loss": 0.4673, "step": 8518 }, { "epoch": 0.97, "learning_rate": 3.653597249466012e-08, "loss": 0.4412, "step": 8519 }, { "epoch": 0.97, "learning_rate": 3.622051910808666e-08, "loss": 0.4481, "step": 8520 }, { "epoch": 0.97, "learning_rate": 3.5906430981754724e-08, "loss": 0.4613, "step": 8521 }, { "epoch": 0.97, "learning_rate": 3.559370815870211e-08, "loss": 0.4789, "step": 8522 }, { "epoch": 0.97, "learning_rate": 3.528235068177899e-08, "loss": 0.4422, "step": 8523 }, { "epoch": 0.97, "learning_rate": 3.4972358593646785e-08, "loss": 0.4468, "step": 8524 }, { "epoch": 0.97, "learning_rate": 3.466373193678263e-08, "loss": 0.4509, "step": 8525 }, { "epoch": 0.97, "learning_rate": 3.4356470753474927e-08, "loss": 0.4454, "step": 8526 }, { "epoch": 0.97, "learning_rate": 3.4050575085825546e-08, "loss": 0.4475, "step": 8527 }, { "epoch": 0.97, "learning_rate": 3.3746044975749845e-08, "loss": 0.4434, "step": 8528 }, { "epoch": 0.97, "learning_rate": 3.3442880464972237e-08, "loss": 0.4462, "step": 8529 }, { "epoch": 0.97, "learning_rate": 3.314108159503726e-08, "loss": 0.4664, "step": 8530 }, { "epoch": 0.97, "learning_rate": 3.284064840729406e-08, "loss": 0.453, "step": 8531 }, { "epoch": 0.98, "learning_rate": 3.2541580942911935e-08, "loss": 0.4415, "step": 8532 }, { "epoch": 0.98, "learning_rate": 3.224387924286698e-08, "loss": 0.4437, "step": 8533 }, { "epoch": 0.98, "learning_rate": 3.1947543347953246e-08, "loss": 0.4495, "step": 8534 }, { "epoch": 0.98, "learning_rate": 3.1652573298774916e-08, "loss": 0.4552, "step": 8535 }, { "epoch": 0.98, "learning_rate": 3.135896913574743e-08, "loss": 0.4514, "step": 8536 }, { "epoch": 0.98, "learning_rate": 3.106673089910417e-08, "loss": 0.4368, "step": 8537 }, { "epoch": 0.98, "learning_rate": 3.077585862888643e-08, "loss": 0.4588, "step": 8538 }, { "epoch": 0.98, "learning_rate": 3.048635236495012e-08, "loss": 0.446, "step": 8539 }, { "epoch": 0.98, "learning_rate": 3.019821214696572e-08, "loss": 0.4568, "step": 8540 }, { "epoch": 0.98, "learning_rate": 2.9911438014412765e-08, "loss": 0.4559, "step": 8541 }, { "epoch": 0.98, "learning_rate": 2.962603000658648e-08, "loss": 0.4478, "step": 8542 }, { "epoch": 0.98, "learning_rate": 2.9341988162595593e-08, "loss": 0.458, "step": 8543 }, { "epoch": 0.98, "learning_rate": 2.905931252135785e-08, "loss": 0.4289, "step": 8544 }, { "epoch": 0.98, "learning_rate": 2.8778003121607834e-08, "loss": 0.4586, "step": 8545 }, { "epoch": 0.98, "learning_rate": 2.849806000189026e-08, "loss": 0.4475, "step": 8546 }, { "epoch": 0.98, "learning_rate": 2.8219483200563334e-08, "loss": 0.4482, "step": 8547 }, { "epoch": 0.98, "learning_rate": 2.794227275579986e-08, "loss": 0.4307, "step": 8548 }, { "epoch": 0.98, "learning_rate": 2.766642870558278e-08, "loss": 0.4794, "step": 8549 }, { "epoch": 0.98, "learning_rate": 2.7391951087708534e-08, "loss": 0.4402, "step": 8550 }, { "epoch": 0.98, "learning_rate": 2.7118839939787033e-08, "loss": 0.4402, "step": 8551 }, { "epoch": 0.98, "learning_rate": 2.6847095299241678e-08, "loss": 0.4382, "step": 8552 }, { "epoch": 0.98, "learning_rate": 2.6576717203304904e-08, "loss": 0.4644, "step": 8553 }, { "epoch": 0.98, "learning_rate": 2.6307705689028184e-08, "loss": 0.4639, "step": 8554 }, { "epoch": 0.98, "learning_rate": 2.6040060793268705e-08, "loss": 0.4479, "step": 8555 }, { "epoch": 0.98, "learning_rate": 2.5773782552701578e-08, "loss": 0.4348, "step": 8556 }, { "epoch": 0.98, "learning_rate": 2.550887100381205e-08, "loss": 0.436, "step": 8557 }, { "epoch": 0.98, "learning_rate": 2.5245326182899987e-08, "loss": 0.4596, "step": 8558 }, { "epoch": 0.98, "learning_rate": 2.4983148126076494e-08, "loss": 0.4529, "step": 8559 }, { "epoch": 0.98, "learning_rate": 2.4722336869265063e-08, "loss": 0.4305, "step": 8560 }, { "epoch": 0.98, "learning_rate": 2.4462892448202657e-08, "loss": 0.4697, "step": 8561 }, { "epoch": 0.98, "learning_rate": 2.4204814898440844e-08, "loss": 0.4521, "step": 8562 }, { "epoch": 0.98, "learning_rate": 2.394810425534022e-08, "loss": 0.4691, "step": 8563 }, { "epoch": 0.98, "learning_rate": 2.369276055407599e-08, "loss": 0.4614, "step": 8564 }, { "epoch": 0.98, "learning_rate": 2.3438783829635714e-08, "loss": 0.4483, "step": 8565 }, { "epoch": 0.98, "learning_rate": 2.318617411682156e-08, "loss": 0.4659, "step": 8566 }, { "epoch": 0.98, "learning_rate": 2.2934931450245833e-08, "loss": 0.4533, "step": 8567 }, { "epoch": 0.98, "learning_rate": 2.2685055864333227e-08, "loss": 0.4534, "step": 8568 }, { "epoch": 0.98, "learning_rate": 2.2436547393323017e-08, "loss": 0.4475, "step": 8569 }, { "epoch": 0.98, "learning_rate": 2.218940607126685e-08, "loss": 0.4378, "step": 8570 }, { "epoch": 0.98, "learning_rate": 2.1943631932028752e-08, "loss": 0.4555, "step": 8571 }, { "epoch": 0.98, "learning_rate": 2.169922500928512e-08, "loss": 0.4596, "step": 8572 }, { "epoch": 0.98, "learning_rate": 2.1456185336524714e-08, "loss": 0.4347, "step": 8573 }, { "epoch": 0.98, "learning_rate": 2.1214512947048684e-08, "loss": 0.4469, "step": 8574 }, { "epoch": 0.98, "learning_rate": 2.097420787397275e-08, "loss": 0.4515, "step": 8575 }, { "epoch": 0.98, "learning_rate": 2.0735270150223917e-08, "loss": 0.4495, "step": 8576 }, { "epoch": 0.98, "learning_rate": 2.0497699808542658e-08, "loss": 0.4537, "step": 8577 }, { "epoch": 0.98, "learning_rate": 2.0261496881479605e-08, "loss": 0.4443, "step": 8578 }, { "epoch": 0.98, "learning_rate": 2.002666140140108e-08, "loss": 0.4546, "step": 8579 }, { "epoch": 0.98, "learning_rate": 1.979319340048469e-08, "loss": 0.4571, "step": 8580 }, { "epoch": 0.98, "learning_rate": 1.956109291072039e-08, "loss": 0.4424, "step": 8581 }, { "epoch": 0.98, "learning_rate": 1.9330359963910527e-08, "loss": 0.4511, "step": 8582 }, { "epoch": 0.98, "learning_rate": 1.910099459167314e-08, "loss": 0.4563, "step": 8583 }, { "epoch": 0.98, "learning_rate": 1.8872996825433086e-08, "loss": 0.4414, "step": 8584 }, { "epoch": 0.98, "learning_rate": 1.864636669643427e-08, "loss": 0.4554, "step": 8585 }, { "epoch": 0.98, "learning_rate": 1.8421104235727406e-08, "loss": 0.4389, "step": 8586 }, { "epoch": 0.98, "learning_rate": 1.8197209474180023e-08, "loss": 0.4647, "step": 8587 }, { "epoch": 0.98, "learning_rate": 1.7974682442470915e-08, "loss": 0.4403, "step": 8588 }, { "epoch": 0.98, "learning_rate": 1.775352317109014e-08, "loss": 0.4513, "step": 8589 }, { "epoch": 0.98, "learning_rate": 1.7533731690342338e-08, "loss": 0.4451, "step": 8590 }, { "epoch": 0.98, "learning_rate": 1.7315308030342314e-08, "loss": 0.4486, "step": 8591 }, { "epoch": 0.98, "learning_rate": 1.7098252221021683e-08, "loss": 0.4594, "step": 8592 }, { "epoch": 0.98, "learning_rate": 1.6882564292119984e-08, "loss": 0.4419, "step": 8593 }, { "epoch": 0.98, "learning_rate": 1.666824427319136e-08, "loss": 0.4521, "step": 8594 }, { "epoch": 0.98, "learning_rate": 1.6455292193603424e-08, "loss": 0.4343, "step": 8595 }, { "epoch": 0.98, "learning_rate": 1.624370808253506e-08, "loss": 0.4542, "step": 8596 }, { "epoch": 0.98, "learning_rate": 1.6033491968976412e-08, "loss": 0.4468, "step": 8597 }, { "epoch": 0.98, "learning_rate": 1.5824643881734438e-08, "loss": 0.4459, "step": 8598 }, { "epoch": 0.98, "learning_rate": 1.561716384942402e-08, "loss": 0.4632, "step": 8599 }, { "epoch": 0.98, "learning_rate": 1.541105190047465e-08, "loss": 0.4459, "step": 8600 }, { "epoch": 0.98, "learning_rate": 1.5206308063129282e-08, "loss": 0.4326, "step": 8601 }, { "epoch": 0.98, "learning_rate": 1.5002932365442148e-08, "loss": 0.4464, "step": 8602 }, { "epoch": 0.98, "learning_rate": 1.480092483527984e-08, "loss": 0.4586, "step": 8603 }, { "epoch": 0.98, "learning_rate": 1.4600285500322442e-08, "loss": 0.4658, "step": 8604 }, { "epoch": 0.98, "learning_rate": 1.4401014388061296e-08, "loss": 0.483, "step": 8605 }, { "epoch": 0.98, "learning_rate": 1.4203111525801228e-08, "loss": 0.4419, "step": 8606 }, { "epoch": 0.98, "learning_rate": 1.4006576940659433e-08, "loss": 0.4547, "step": 8607 }, { "epoch": 0.98, "learning_rate": 1.3811410659565483e-08, "loss": 0.4322, "step": 8608 }, { "epoch": 0.98, "learning_rate": 1.3617612709262428e-08, "loss": 0.4459, "step": 8609 }, { "epoch": 0.98, "learning_rate": 1.3425183116303475e-08, "loss": 0.4408, "step": 8610 }, { "epoch": 0.98, "learning_rate": 1.3234121907056418e-08, "loss": 0.4458, "step": 8611 }, { "epoch": 0.98, "learning_rate": 1.3044429107700319e-08, "loss": 0.4581, "step": 8612 }, { "epoch": 0.98, "learning_rate": 1.2856104744228826e-08, "loss": 0.4792, "step": 8613 }, { "epoch": 0.98, "learning_rate": 1.2669148842444634e-08, "loss": 0.4454, "step": 8614 }, { "epoch": 0.98, "learning_rate": 1.248356142796725e-08, "loss": 0.4506, "step": 8615 }, { "epoch": 0.98, "learning_rate": 1.2299342526224112e-08, "loss": 0.4594, "step": 8616 }, { "epoch": 0.98, "learning_rate": 1.211649216245836e-08, "loss": 0.4516, "step": 8617 }, { "epoch": 0.98, "learning_rate": 1.1935010361724397e-08, "loss": 0.4324, "step": 8618 }, { "epoch": 0.99, "learning_rate": 1.1754897148889e-08, "loss": 0.4501, "step": 8619 }, { "epoch": 0.99, "learning_rate": 1.1576152548631314e-08, "loss": 0.45, "step": 8620 }, { "epoch": 0.99, "learning_rate": 1.1398776585445082e-08, "loss": 0.4689, "step": 8621 }, { "epoch": 0.99, "learning_rate": 1.1222769283633083e-08, "loss": 0.4379, "step": 8622 }, { "epoch": 0.99, "learning_rate": 1.1048130667312695e-08, "loss": 0.449, "step": 8623 }, { "epoch": 0.99, "learning_rate": 1.0874860760413664e-08, "loss": 0.4387, "step": 8624 }, { "epoch": 0.99, "learning_rate": 1.0702959586678108e-08, "loss": 0.4623, "step": 8625 }, { "epoch": 0.99, "learning_rate": 1.0532427169659409e-08, "loss": 0.4342, "step": 8626 }, { "epoch": 0.99, "learning_rate": 1.0363263532724433e-08, "loss": 0.4405, "step": 8627 }, { "epoch": 0.99, "learning_rate": 1.0195468699052413e-08, "loss": 0.457, "step": 8628 }, { "epoch": 0.99, "learning_rate": 1.0029042691636071e-08, "loss": 0.4239, "step": 8629 }, { "epoch": 0.99, "learning_rate": 9.863985533278275e-09, "loss": 0.4434, "step": 8630 }, { "epoch": 0.99, "learning_rate": 9.700297246596491e-09, "loss": 0.461, "step": 8631 }, { "epoch": 0.99, "learning_rate": 9.537977854018332e-09, "loss": 0.4584, "step": 8632 }, { "epoch": 0.99, "learning_rate": 9.377027377786007e-09, "loss": 0.4492, "step": 8633 }, { "epoch": 0.99, "learning_rate": 9.217445839952988e-09, "loss": 0.4512, "step": 8634 }, { "epoch": 0.99, "learning_rate": 9.059233262386225e-09, "loss": 0.4474, "step": 8635 }, { "epoch": 0.99, "learning_rate": 8.902389666765044e-09, "loss": 0.4534, "step": 8636 }, { "epoch": 0.99, "learning_rate": 8.746915074577811e-09, "loss": 0.4459, "step": 8637 }, { "epoch": 0.99, "learning_rate": 8.592809507129706e-09, "loss": 0.4423, "step": 8638 }, { "epoch": 0.99, "learning_rate": 8.440072985537174e-09, "loss": 0.4627, "step": 8639 }, { "epoch": 0.99, "learning_rate": 8.288705530727915e-09, "loss": 0.4505, "step": 8640 }, { "epoch": 0.99, "learning_rate": 8.138707163442005e-09, "loss": 0.4333, "step": 8641 }, { "epoch": 0.99, "learning_rate": 7.990077904234117e-09, "loss": 0.4511, "step": 8642 }, { "epoch": 0.99, "learning_rate": 7.84281777346796e-09, "loss": 0.457, "step": 8643 }, { "epoch": 0.99, "learning_rate": 7.696926791322946e-09, "loss": 0.4234, "step": 8644 }, { "epoch": 0.99, "learning_rate": 7.552404977788641e-09, "loss": 0.4557, "step": 8645 }, { "epoch": 0.99, "learning_rate": 7.409252352668095e-09, "loss": 0.444, "step": 8646 }, { "epoch": 0.99, "learning_rate": 7.267468935575617e-09, "loss": 0.455, "step": 8647 }, { "epoch": 0.99, "learning_rate": 7.12705474594011e-09, "loss": 0.4692, "step": 8648 }, { "epoch": 0.99, "learning_rate": 6.988009803000628e-09, "loss": 0.4765, "step": 8649 }, { "epoch": 0.99, "learning_rate": 6.8503341258086e-09, "loss": 0.4445, "step": 8650 }, { "epoch": 0.99, "learning_rate": 6.714027733230044e-09, "loss": 0.4319, "step": 8651 }, { "epoch": 0.99, "learning_rate": 6.579090643942243e-09, "loss": 0.4481, "step": 8652 }, { "epoch": 0.99, "learning_rate": 6.4455228764326305e-09, "loss": 0.4501, "step": 8653 }, { "epoch": 0.99, "learning_rate": 6.3133244490043434e-09, "loss": 0.4475, "step": 8654 }, { "epoch": 0.99, "learning_rate": 6.18249537977178e-09, "loss": 0.4532, "step": 8655 }, { "epoch": 0.99, "learning_rate": 6.053035686661712e-09, "loss": 0.4401, "step": 8656 }, { "epoch": 0.99, "learning_rate": 5.924945387411063e-09, "loss": 0.4532, "step": 8657 }, { "epoch": 0.99, "learning_rate": 5.798224499572458e-09, "loss": 0.4334, "step": 8658 }, { "epoch": 0.99, "learning_rate": 5.672873040509786e-09, "loss": 0.4682, "step": 8659 }, { "epoch": 0.99, "learning_rate": 5.548891027398195e-09, "loss": 0.4225, "step": 8660 }, { "epoch": 0.99, "learning_rate": 5.426278477226321e-09, "loss": 0.4527, "step": 8661 }, { "epoch": 0.99, "learning_rate": 5.305035406795167e-09, "loss": 0.4467, "step": 8662 }, { "epoch": 0.99, "learning_rate": 5.185161832718111e-09, "loss": 0.4284, "step": 8663 }, { "epoch": 0.99, "learning_rate": 5.0666577714186815e-09, "loss": 0.4373, "step": 8664 }, { "epoch": 0.99, "learning_rate": 4.949523239136112e-09, "loss": 0.4694, "step": 8665 }, { "epoch": 0.99, "learning_rate": 4.833758251919785e-09, "loss": 0.4355, "step": 8666 }, { "epoch": 0.99, "learning_rate": 4.7193628256325676e-09, "loss": 0.4348, "step": 8667 }, { "epoch": 0.99, "learning_rate": 4.606336975948589e-09, "loss": 0.4469, "step": 8668 }, { "epoch": 0.99, "learning_rate": 4.494680718355459e-09, "loss": 0.4447, "step": 8669 }, { "epoch": 0.99, "learning_rate": 4.384394068153164e-09, "loss": 0.4434, "step": 8670 }, { "epoch": 0.99, "learning_rate": 4.275477040451836e-09, "loss": 0.453, "step": 8671 }, { "epoch": 0.99, "learning_rate": 4.167929650176206e-09, "loss": 0.4588, "step": 8672 }, { "epoch": 0.99, "learning_rate": 4.061751912063372e-09, "loss": 0.4509, "step": 8673 }, { "epoch": 0.99, "learning_rate": 3.956943840661698e-09, "loss": 0.4543, "step": 8674 }, { "epoch": 0.99, "learning_rate": 3.853505450331918e-09, "loss": 0.4426, "step": 8675 }, { "epoch": 0.99, "learning_rate": 3.751436755247139e-09, "loss": 0.4451, "step": 8676 }, { "epoch": 0.99, "learning_rate": 3.650737769393953e-09, "loss": 0.4378, "step": 8677 }, { "epoch": 0.99, "learning_rate": 3.5514085065690984e-09, "loss": 0.4355, "step": 8678 }, { "epoch": 0.99, "learning_rate": 3.4534489803850215e-09, "loss": 0.4543, "step": 8679 }, { "epoch": 0.99, "learning_rate": 3.3568592042620974e-09, "loss": 0.4409, "step": 8680 }, { "epoch": 0.99, "learning_rate": 3.2616391914364056e-09, "loss": 0.4628, "step": 8681 }, { "epoch": 0.99, "learning_rate": 3.167788954954176e-09, "loss": 0.4445, "step": 8682 }, { "epoch": 0.99, "learning_rate": 3.075308507677344e-09, "loss": 0.4646, "step": 8683 }, { "epoch": 0.99, "learning_rate": 2.9841978622746624e-09, "loss": 0.4466, "step": 8684 }, { "epoch": 0.99, "learning_rate": 2.894457031232811e-09, "loss": 0.4682, "step": 8685 }, { "epoch": 0.99, "learning_rate": 2.8060860268475097e-09, "loss": 0.4413, "step": 8686 }, { "epoch": 0.99, "learning_rate": 2.7190848612279606e-09, "loss": 0.4405, "step": 8687 }, { "epoch": 0.99, "learning_rate": 2.6334535462935184e-09, "loss": 0.46, "step": 8688 }, { "epoch": 0.99, "learning_rate": 2.54919209377924e-09, "loss": 0.454, "step": 8689 }, { "epoch": 0.99, "learning_rate": 2.4663005152314455e-09, "loss": 0.4464, "step": 8690 }, { "epoch": 0.99, "learning_rate": 2.384778822006606e-09, "loss": 0.4624, "step": 8691 }, { "epoch": 0.99, "learning_rate": 2.304627025274675e-09, "loss": 0.4351, "step": 8692 }, { "epoch": 0.99, "learning_rate": 2.225845136019089e-09, "loss": 0.4529, "step": 8693 }, { "epoch": 0.99, "learning_rate": 2.148433165035657e-09, "loss": 0.4624, "step": 8694 }, { "epoch": 0.99, "learning_rate": 2.0723911229303396e-09, "loss": 0.4256, "step": 8695 }, { "epoch": 0.99, "learning_rate": 1.9977190201225793e-09, "loss": 0.4375, "step": 8696 }, { "epoch": 0.99, "learning_rate": 1.924416866844192e-09, "loss": 0.4619, "step": 8697 }, { "epoch": 0.99, "learning_rate": 1.8524846731404755e-09, "loss": 0.4525, "step": 8698 }, { "epoch": 0.99, "learning_rate": 1.7819224488657695e-09, "loss": 0.4452, "step": 8699 }, { "epoch": 0.99, "learning_rate": 1.7127302036901162e-09, "loss": 0.4516, "step": 8700 }, { "epoch": 0.99, "learning_rate": 1.6449079470937103e-09, "loss": 0.4446, "step": 8701 }, { "epoch": 0.99, "learning_rate": 1.5784556883691183e-09, "loss": 0.4504, "step": 8702 }, { "epoch": 0.99, "learning_rate": 1.5133734366234998e-09, "loss": 0.458, "step": 8703 }, { "epoch": 0.99, "learning_rate": 1.449661200773056e-09, "loss": 0.4442, "step": 8704 }, { "epoch": 0.99, "learning_rate": 1.3873189895485806e-09, "loss": 0.4447, "step": 8705 }, { "epoch": 0.99, "learning_rate": 1.3263468114921295e-09, "loss": 0.4641, "step": 8706 }, { "epoch": 1.0, "learning_rate": 1.2667446749581314e-09, "loss": 0.4302, "step": 8707 }, { "epoch": 1.0, "learning_rate": 1.2085125881133863e-09, "loss": 0.4294, "step": 8708 }, { "epoch": 1.0, "learning_rate": 1.1516505589381777e-09, "loss": 0.4844, "step": 8709 }, { "epoch": 1.0, "learning_rate": 1.0961585952218301e-09, "loss": 0.4651, "step": 8710 }, { "epoch": 1.0, "learning_rate": 1.042036704568261e-09, "loss": 0.4544, "step": 8711 }, { "epoch": 1.0, "learning_rate": 9.89284894395981e-10, "loss": 0.4279, "step": 8712 }, { "epoch": 1.0, "learning_rate": 9.37903171929211e-10, "loss": 0.4377, "step": 8713 }, { "epoch": 1.0, "learning_rate": 8.878915442123159e-10, "loss": 0.4588, "step": 8714 }, { "epoch": 1.0, "learning_rate": 8.392500180953722e-10, "loss": 0.4642, "step": 8715 }, { "epoch": 1.0, "learning_rate": 7.919786002441588e-10, "loss": 0.4456, "step": 8716 }, { "epoch": 1.0, "learning_rate": 7.460772971357167e-10, "loss": 0.4498, "step": 8717 }, { "epoch": 1.0, "learning_rate": 7.015461150594594e-10, "loss": 0.4332, "step": 8718 }, { "epoch": 1.0, "learning_rate": 6.583850601182829e-10, "loss": 0.4588, "step": 8719 }, { "epoch": 1.0, "learning_rate": 6.165941382241248e-10, "loss": 0.449, "step": 8720 }, { "epoch": 1.0, "learning_rate": 5.761733551057357e-10, "loss": 0.4273, "step": 8721 }, { "epoch": 1.0, "learning_rate": 5.371227162997983e-10, "loss": 0.4443, "step": 8722 }, { "epoch": 1.0, "learning_rate": 4.994422271575872e-10, "loss": 0.4435, "step": 8723 }, { "epoch": 1.0, "learning_rate": 4.631318928427497e-10, "loss": 0.4719, "step": 8724 }, { "epoch": 1.0, "learning_rate": 4.2819171833019537e-10, "loss": 0.4333, "step": 8725 }, { "epoch": 1.0, "learning_rate": 3.946217084072057e-10, "loss": 0.4628, "step": 8726 }, { "epoch": 1.0, "learning_rate": 3.624218676734348e-10, "loss": 0.4442, "step": 8727 }, { "epoch": 1.0, "learning_rate": 3.315922005420191e-10, "loss": 0.467, "step": 8728 }, { "epoch": 1.0, "learning_rate": 3.0213271123735735e-10, "loss": 0.4376, "step": 8729 }, { "epoch": 1.0, "learning_rate": 2.740434037951101e-10, "loss": 0.4528, "step": 8730 }, { "epoch": 1.0, "learning_rate": 2.4732428206442063e-10, "loss": 0.4384, "step": 8731 }, { "epoch": 1.0, "learning_rate": 2.2197534970569424e-10, "loss": 0.4699, "step": 8732 }, { "epoch": 1.0, "learning_rate": 1.9799661019392901e-10, "loss": 0.4377, "step": 8733 }, { "epoch": 1.0, "learning_rate": 1.7538806681316467e-10, "loss": 0.4585, "step": 8734 }, { "epoch": 1.0, "learning_rate": 1.5414972266314389e-10, "loss": 0.45, "step": 8735 }, { "epoch": 1.0, "learning_rate": 1.3428158065154073e-10, "loss": 0.433, "step": 8736 }, { "epoch": 1.0, "learning_rate": 1.1578364350284254e-10, "loss": 0.4574, "step": 8737 }, { "epoch": 1.0, "learning_rate": 9.865591375168848e-11, "loss": 0.4435, "step": 8738 }, { "epoch": 1.0, "learning_rate": 8.289839374286956e-11, "loss": 0.4497, "step": 8739 }, { "epoch": 1.0, "learning_rate": 6.851108563687981e-11, "loss": 0.4621, "step": 8740 }, { "epoch": 1.0, "learning_rate": 5.549399140547529e-11, "loss": 0.4419, "step": 8741 }, { "epoch": 1.0, "learning_rate": 4.3847112831674196e-11, "loss": 0.4573, "step": 8742 }, { "epoch": 1.0, "learning_rate": 3.3570451511977245e-11, "loss": 0.4466, "step": 8743 }, { "epoch": 1.0, "learning_rate": 2.466400885303699e-11, "loss": 0.4322, "step": 8744 }, { "epoch": 1.0, "learning_rate": 1.7127786077208998e-11, "loss": 0.4459, "step": 8745 }, { "epoch": 1.0, "learning_rate": 1.0961784215890448e-11, "loss": 0.4587, "step": 8746 }, { "epoch": 1.0, "learning_rate": 6.166004113961066e-12, "loss": 0.4332, "step": 8747 }, { "epoch": 1.0, "learning_rate": 2.7404464297831057e-12, "loss": 0.452, "step": 8748 }, { "epoch": 1.0, "learning_rate": 6.8511163076046e-13, "loss": 0.4351, "step": 8749 }, { "epoch": 1.0, "learning_rate": 0.0, "loss": 0.4951, "step": 8750 }, { "epoch": 1.0, "step": 8750, "total_flos": 0.0, "train_loss": 0.09011299923147474, "train_runtime": 10298.0352, "train_samples_per_second": 438.849, "train_steps_per_second": 0.85 } ], "logging_steps": 1.0, "max_steps": 8750, "num_input_tokens_seen": 0, "num_train_epochs": 1, "save_steps": 100, "total_flos": 0.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }