diff --git "a/self_to_selective_run_0_restarted/log2.txt" "b/self_to_selective_run_0_restarted/log2.txt" new file mode 100644--- /dev/null +++ "b/self_to_selective_run_0_restarted/log2.txt" @@ -0,0 +1,2714 @@ +max_steps: 2500 +0 val loss 3.2108 +0 val perplexity 24.7985 +0 hella 0.2879 +0 train 3.188860 (lr=8.3916e-07) (hash(x)=45139629) +1 train 3.210170 (lr=1.6783e-06) (hash(x)=40085918) +2 train 3.252200 (lr=2.5175e-06) (hash(x)=39437218) +3 train 3.221355 (lr=3.3566e-06) (hash(x)=38902640) +4 train 3.176795 (lr=4.1958e-06) (hash(x)=40916546) +5 train 3.216760 (lr=5.0350e-06) (hash(x)=38766569) +6 train 3.182583 (lr=5.8741e-06) (hash(x)=44673131) +7 train 3.221203 (lr=6.7133e-06) (hash(x)=41810941) +8 train 3.185651 (lr=7.5524e-06) (hash(x)=35843271) +9 train 3.236627 (lr=8.3916e-06) (hash(x)=41241157) +10 train 3.261769 (lr=9.2308e-06) (hash(x)=39820755) +11 train 3.242730 (lr=1.0070e-05) (hash(x)=44867914) +12 train 3.236105 (lr=1.0909e-05) (hash(x)=45634132) +13 train 3.238039 (lr=1.1748e-05) (hash(x)=41550360) +14 train 3.230192 (lr=1.2587e-05) (hash(x)=37900494) +15 train 3.179368 (lr=1.3427e-05) (hash(x)=47433035) +16 train 3.252406 (lr=1.4266e-05) (hash(x)=37736146) +17 train 3.209925 (lr=1.5105e-05) (hash(x)=40194237) +18 train 3.279535 (lr=1.5944e-05) (hash(x)=43645651) +19 train 3.182355 (lr=1.6783e-05) (hash(x)=41146626) +20 train 3.238630 (lr=1.7622e-05) (hash(x)=33771440) +21 train 3.222870 (lr=1.8462e-05) (hash(x)=37989611) +22 train 3.229191 (lr=1.9301e-05) (hash(x)=36728745) +23 train 3.325903 (lr=2.0140e-05) (hash(x)=50363432) +24 train 3.221967 (lr=2.0979e-05) (hash(x)=38675441) +25 val loss 3.1992 +25 val perplexity 24.5126 +25 train 3.279148 (lr=2.1818e-05) (hash(x)=41257552) +26 train 3.181159 (lr=2.2657e-05) (hash(x)=40050647) +27 train 3.276433 (lr=2.3497e-05) (hash(x)=39787728) +28 train 3.242238 (lr=2.4336e-05) (hash(x)=42651056) +29 train 3.258805 (lr=2.5175e-05) (hash(x)=38139665) +30 train 3.262764 (lr=2.6014e-05) (hash(x)=39311404) +31 train 3.250903 (lr=2.6853e-05) (hash(x)=40130466) +32 train 3.181154 (lr=2.7692e-05) (hash(x)=36659677) +33 train 3.196456 (lr=2.8531e-05) (hash(x)=33799980) +34 train 3.147905 (lr=2.9371e-05) (hash(x)=58139808) +35 train 3.130027 (lr=3.0210e-05) (hash(x)=29847449) +36 train 3.224982 (lr=3.1049e-05) (hash(x)=35668373) +37 train 3.165407 (lr=3.1888e-05) (hash(x)=40750587) +38 train 3.183480 (lr=3.2727e-05) (hash(x)=36323410) +39 train 3.152521 (lr=3.3566e-05) (hash(x)=39923591) +40 train 3.148239 (lr=3.4406e-05) (hash(x)=30172063) +41 train 3.185596 (lr=3.5245e-05) (hash(x)=37173479) +42 train 3.227866 (lr=3.6084e-05) (hash(x)=35680391) +43 train 3.189787 (lr=3.6923e-05) (hash(x)=46394316) +44 train 3.237585 (lr=3.7762e-05) (hash(x)=39877497) +45 train 3.261118 (lr=3.8601e-05) (hash(x)=51033830) +46 train 3.206652 (lr=3.9441e-05) (hash(x)=44283476) +47 train 3.179192 (lr=4.0280e-05) (hash(x)=35947128) +48 train 3.253129 (lr=4.1119e-05) (hash(x)=39673493) +49 train 3.293015 (lr=4.1958e-05) (hash(x)=41136140) +50 val loss 3.1954 +50 val perplexity 24.4208 +50 train 3.204135 (lr=4.2797e-05) (hash(x)=48422333) +51 train 3.251581 (lr=4.3636e-05) (hash(x)=40183642) +52 train 3.267971 (lr=4.4476e-05) (hash(x)=40351272) +53 train 3.266420 (lr=4.5315e-05) (hash(x)=35297194) +54 train 3.192312 (lr=4.6154e-05) (hash(x)=46125579) +55 train 3.202805 (lr=4.6993e-05) (hash(x)=38248426) +56 train 3.215544 (lr=4.7832e-05) (hash(x)=40448340) +57 train 3.159972 (lr=4.8671e-05) (hash(x)=44146752) +58 train 3.241081 (lr=4.9510e-05) (hash(x)=39395791) +59 train 3.193424 (lr=5.0350e-05) (hash(x)=38968710) +60 train 3.230428 (lr=5.1189e-05) (hash(x)=40327880) +61 train 3.200022 (lr=5.2028e-05) (hash(x)=40302068) +62 train 3.321117 (lr=5.2867e-05) (hash(x)=38218472) +63 train 3.296474 (lr=5.3706e-05) (hash(x)=36478415) +64 train 3.238307 (lr=5.4545e-05) (hash(x)=37508311) +65 train 3.201221 (lr=5.5385e-05) (hash(x)=37293910) +66 train 3.277448 (lr=5.6224e-05) (hash(x)=34296333) +67 train 3.217036 (lr=5.7063e-05) (hash(x)=46892614) +68 train 3.212727 (lr=5.7902e-05) (hash(x)=36312048) +69 train 3.199722 (lr=5.8741e-05) (hash(x)=39850010) +70 train 3.150677 (lr=5.9580e-05) (hash(x)=40331461) +71 train 3.204905 (lr=6.0420e-05) (hash(x)=35911842) +72 train 3.242416 (lr=6.1259e-05) (hash(x)=36004808) +73 train 3.181610 (lr=6.2098e-05) (hash(x)=34087934) +74 train 3.208276 (lr=6.2937e-05) (hash(x)=37490984) +75 val loss 3.1957 +75 val perplexity 24.4262 +75 train 3.155364 (lr=6.3776e-05) (hash(x)=41584400) +76 train 3.169448 (lr=6.4615e-05) (hash(x)=40209862) +77 train 3.191649 (lr=6.5455e-05) (hash(x)=39307212) +78 train 3.212517 (lr=6.6294e-05) (hash(x)=40355012) +79 train 3.181795 (lr=6.7133e-05) (hash(x)=42472212) +80 train 3.239005 (lr=6.7972e-05) (hash(x)=39486935) +81 train 3.219662 (lr=6.8811e-05) (hash(x)=45975249) +82 train 3.212671 (lr=6.9650e-05) (hash(x)=41472786) +83 train 3.233334 (lr=7.0490e-05) (hash(x)=38338768) +84 train 3.268187 (lr=7.1329e-05) (hash(x)=41278608) +85 train 3.246467 (lr=7.2168e-05) (hash(x)=47810152) +86 train 3.218241 (lr=7.3007e-05) (hash(x)=39879804) +87 train 3.272779 (lr=7.3846e-05) (hash(x)=38429116) +88 train 3.280233 (lr=7.4685e-05) (hash(x)=40666583) +89 train 3.201899 (lr=7.5524e-05) (hash(x)=34785747) +90 train 3.192552 (lr=7.6364e-05) (hash(x)=39194835) +91 train 3.318100 (lr=7.7203e-05) (hash(x)=42697095) +92 train 3.205111 (lr=7.8042e-05) (hash(x)=39119037) +93 train 3.226720 (lr=7.8881e-05) (hash(x)=43825870) +94 train 3.141108 (lr=7.9720e-05) (hash(x)=39843712) +95 train 3.270424 (lr=8.0559e-05) (hash(x)=42307415) +96 train 3.241421 (lr=8.1399e-05) (hash(x)=40879729) +97 train 3.189887 (lr=8.2238e-05) (hash(x)=39084196) +98 train 3.182296 (lr=8.3077e-05) (hash(x)=39072380) +99 train 3.214878 (lr=8.3916e-05) (hash(x)=37774632) +100 val loss 3.1953 +100 val perplexity 24.4169 +100 train 3.232985 (lr=8.4755e-05) (hash(x)=38242852) +101 train 3.154906 (lr=8.5594e-05) (hash(x)=47481547) +102 train 3.205056 (lr=8.6434e-05) (hash(x)=29646220) +103 train 3.216517 (lr=8.7273e-05) (hash(x)=39256869) +104 train 3.245875 (lr=8.8112e-05) (hash(x)=41662676) +105 train 3.203347 (lr=8.8951e-05) (hash(x)=41510127) +106 train 3.189881 (lr=8.9790e-05) (hash(x)=37963143) +107 train 3.258845 (lr=9.0629e-05) (hash(x)=41134836) +108 train 3.164810 (lr=9.1469e-05) (hash(x)=35407710) +109 train 3.215079 (lr=9.2308e-05) (hash(x)=41549763) +110 train 3.184008 (lr=9.3147e-05) (hash(x)=42188513) +111 train 3.203768 (lr=9.3986e-05) (hash(x)=44079319) +112 train 3.177841 (lr=9.4825e-05) (hash(x)=37270678) +113 train 3.242494 (lr=9.5664e-05) (hash(x)=39663509) +114 train 3.189794 (lr=9.6503e-05) (hash(x)=42219117) +115 train 3.175172 (lr=9.7343e-05) (hash(x)=43027774) +116 train 3.176968 (lr=9.8182e-05) (hash(x)=37997349) +117 train 3.251040 (lr=9.9021e-05) (hash(x)=43514823) +118 train 3.156171 (lr=9.9860e-05) (hash(x)=44226760) +119 train 3.277204 (lr=1.0070e-04) (hash(x)=36492021) +120 train 3.214025 (lr=1.0154e-04) (hash(x)=38505610) +121 train 3.278578 (lr=1.0238e-04) (hash(x)=44556113) +122 train 3.216431 (lr=1.0322e-04) (hash(x)=40774582) +123 train 3.206781 (lr=1.0406e-04) (hash(x)=40192579) +124 train 3.265087 (lr=1.0490e-04) (hash(x)=41821538) +125 val loss 3.1969 +125 val perplexity 24.4557 +125 train 3.206953 (lr=1.0573e-04) (hash(x)=39708159) +126 train 3.226967 (lr=1.0657e-04) (hash(x)=40473111) +127 train 3.224724 (lr=1.0741e-04) (hash(x)=38419253) +128 train 3.285569 (lr=1.0825e-04) (hash(x)=40895764) +129 train 3.173731 (lr=1.0909e-04) (hash(x)=43715420) +130 train 3.247999 (lr=1.0993e-04) (hash(x)=39082451) +131 train 3.222646 (lr=1.1077e-04) (hash(x)=46270726) +132 train 3.221644 (lr=1.1161e-04) (hash(x)=40065484) +133 train 3.269892 (lr=1.1245e-04) (hash(x)=42195345) +134 train 3.222236 (lr=1.1329e-04) (hash(x)=39206335) +135 train 3.303406 (lr=1.1413e-04) (hash(x)=44403491) +136 train 3.178816 (lr=1.1497e-04) (hash(x)=34899168) +137 train 3.231464 (lr=1.1580e-04) (hash(x)=39499428) +138 train 3.236811 (lr=1.1664e-04) (hash(x)=38404890) +139 train 3.250799 (lr=1.1748e-04) (hash(x)=38474967) +140 train 3.211131 (lr=1.1832e-04) (hash(x)=39744891) +141 train 3.195572 (lr=1.1916e-04) (hash(x)=44040862) +142 train 3.185149 (lr=1.2000e-04) (hash(x)=36323333) +143 train 3.215918 (lr=1.2084e-04) (hash(x)=39386364) +144 train 3.174016 (lr=1.2168e-04) (hash(x)=40427317) +145 train 3.159354 (lr=1.2252e-04) (hash(x)=42802607) +146 train 3.158020 (lr=1.2336e-04) (hash(x)=36840030) +147 train 3.178896 (lr=1.2420e-04) (hash(x)=40275305) +148 train 3.174115 (lr=1.2503e-04) (hash(x)=27565371) +149 train 3.158358 (lr=1.2587e-04) (hash(x)=39356489) +150 val loss 3.2012 +150 val perplexity 24.5627 +150 train 3.104550 (lr=1.2671e-04) (hash(x)=41248932) +151 train 3.162531 (lr=1.2755e-04) (hash(x)=33292198) +152 train 3.212072 (lr=1.2839e-04) (hash(x)=37246571) +153 train 3.193663 (lr=1.2923e-04) (hash(x)=44475699) +154 train 3.186467 (lr=1.3007e-04) (hash(x)=40873247) +155 train 3.247133 (lr=1.3091e-04) (hash(x)=41715891) +156 train 3.244513 (lr=1.3175e-04) (hash(x)=41786046) +157 train 3.231275 (lr=1.3259e-04) (hash(x)=41608043) +158 train 3.216074 (lr=1.3343e-04) (hash(x)=34153256) +159 train 3.260266 (lr=1.3427e-04) (hash(x)=37921676) +160 train 3.252272 (lr=1.3510e-04) (hash(x)=44285951) +161 train 3.203823 (lr=1.3594e-04) (hash(x)=38096180) +162 train 3.205808 (lr=1.3678e-04) (hash(x)=37180774) +163 train 3.268545 (lr=1.3762e-04) (hash(x)=42011682) +164 train 3.245454 (lr=1.3846e-04) (hash(x)=38499641) +165 train 3.281474 (lr=1.3930e-04) (hash(x)=44244047) +166 train 3.241771 (lr=1.4014e-04) (hash(x)=43565362) +167 train 3.240392 (lr=1.4098e-04) (hash(x)=37448390) +168 train 3.275696 (lr=1.4182e-04) (hash(x)=36594415) +169 train 3.188987 (lr=1.4266e-04) (hash(x)=41707842) +170 train 3.254439 (lr=1.4350e-04) (hash(x)=41965277) +171 train 3.260684 (lr=1.4434e-04) (hash(x)=34978908) +172 train 3.233830 (lr=1.4517e-04) (hash(x)=32286346) +173 train 3.240018 (lr=1.4601e-04) (hash(x)=42491155) +174 train 3.356848 (lr=1.4685e-04) (hash(x)=36950844) +175 val loss 3.2028 +175 val perplexity 24.6022 +175 train 3.206254 (lr=1.4769e-04) (hash(x)=36548378) +176 train 3.275970 (lr=1.4853e-04) (hash(x)=41133438) +177 train 3.254955 (lr=1.4937e-04) (hash(x)=44074665) +178 train 3.209630 (lr=1.5021e-04) (hash(x)=39075311) +179 train 3.202165 (lr=1.5105e-04) (hash(x)=48276963) +180 train 3.220315 (lr=1.5189e-04) (hash(x)=35201785) +181 train 3.143323 (lr=1.5273e-04) (hash(x)=37288788) +182 train 3.195181 (lr=1.5357e-04) (hash(x)=37072035) +183 train 3.207652 (lr=1.5441e-04) (hash(x)=45192047) +184 train 3.169029 (lr=1.5524e-04) (hash(x)=45691971) +185 train 3.218788 (lr=1.5608e-04) (hash(x)=40094358) +186 train 3.227720 (lr=1.5692e-04) (hash(x)=29645231) +187 train 3.156075 (lr=1.5776e-04) (hash(x)=40680328) +188 train 3.160506 (lr=1.5860e-04) (hash(x)=34945440) +189 train 3.171996 (lr=1.5944e-04) (hash(x)=49101559) +190 train 3.199035 (lr=1.6028e-04) (hash(x)=40318765) +191 train 3.286614 (lr=1.6112e-04) (hash(x)=43154319) +192 train 3.358171 (lr=1.6196e-04) (hash(x)=41898600) +193 train 3.287485 (lr=1.6280e-04) (hash(x)=41155729) +194 train 3.229035 (lr=1.6364e-04) (hash(x)=42277475) +195 train 3.284474 (lr=1.6448e-04) (hash(x)=39443611) +196 train 3.259376 (lr=1.6531e-04) (hash(x)=40025350) +197 train 3.219235 (lr=1.6615e-04) (hash(x)=36746685) +198 train 3.231637 (lr=1.6699e-04) (hash(x)=44832361) +199 train 3.256015 (lr=1.6783e-04) (hash(x)=37832288) +200 val loss 3.2072 +200 val perplexity 24.7100 +200 train 3.284872 (lr=1.6867e-04) (hash(x)=45640196) +201 train 3.241234 (lr=1.6951e-04) (hash(x)=45629369) +202 train 3.287164 (lr=1.7035e-04) (hash(x)=45476522) +203 train 3.251097 (lr=1.7119e-04) (hash(x)=44471578) +204 train 3.249347 (lr=1.7203e-04) (hash(x)=54274920) +205 train 3.246644 (lr=1.7287e-04) (hash(x)=44511457) +206 train 3.197383 (lr=1.7371e-04) (hash(x)=33479634) +207 train 3.238997 (lr=1.7455e-04) (hash(x)=40912591) +208 train 3.227397 (lr=1.7538e-04) (hash(x)=42122661) +209 train 3.281180 (lr=1.7622e-04) (hash(x)=49617387) +210 train 3.268987 (lr=1.7706e-04) (hash(x)=43417063) +211 train 3.269304 (lr=1.7790e-04) (hash(x)=36398599) +212 train 3.276407 (lr=1.7874e-04) (hash(x)=43883975) +213 train 3.221397 (lr=1.7958e-04) (hash(x)=34975551) +214 train 3.273792 (lr=1.8042e-04) (hash(x)=37049834) +215 train 3.226028 (lr=1.8126e-04) (hash(x)=39030011) +216 train 3.220252 (lr=1.8210e-04) (hash(x)=39672297) +217 train 3.141819 (lr=1.8294e-04) (hash(x)=49009965) +218 train 3.224496 (lr=1.8378e-04) (hash(x)=40777727) +219 train 3.195829 (lr=1.8462e-04) (hash(x)=44429939) +220 train 3.250571 (lr=1.8545e-04) (hash(x)=41760392) +221 train 3.186779 (lr=1.8629e-04) (hash(x)=35551075) +222 train 3.165211 (lr=1.8713e-04) (hash(x)=44813441) +223 train 3.233312 (lr=1.8797e-04) (hash(x)=43632162) +224 train 3.183312 (lr=1.8881e-04) (hash(x)=44958040) +225 val loss 3.2130 +225 val perplexity 24.8533 +225 train 3.168892 (lr=1.8965e-04) (hash(x)=41774801) +226 train 3.193253 (lr=1.9049e-04) (hash(x)=40041073) +227 train 3.252361 (lr=1.9133e-04) (hash(x)=37683316) +228 train 3.307604 (lr=1.9217e-04) (hash(x)=38844981) +229 train 3.269639 (lr=1.9301e-04) (hash(x)=22564688) +230 train 3.252237 (lr=1.9385e-04) (hash(x)=39871484) +231 train 3.275402 (lr=1.9469e-04) (hash(x)=43872958) +232 train 3.227078 (lr=1.9552e-04) (hash(x)=44580494) +233 train 3.245291 (lr=1.9636e-04) (hash(x)=34570448) +234 train 3.258671 (lr=1.9720e-04) (hash(x)=41647764) +235 train 3.254607 (lr=1.9804e-04) (hash(x)=42447423) +236 train 3.427083 (lr=1.9888e-04) (hash(x)=37854614) +237 train 3.196925 (lr=1.9972e-04) (hash(x)=33434096) +238 train 3.255851 (lr=2.0056e-04) (hash(x)=44998474) +239 train 3.271535 (lr=2.0140e-04) (hash(x)=42537868) +240 train 3.244548 (lr=2.0224e-04) (hash(x)=39650620) +241 train 3.268091 (lr=2.0308e-04) (hash(x)=43525301) +242 train 3.201042 (lr=2.0392e-04) (hash(x)=38926546) +243 train 3.273253 (lr=2.0476e-04) (hash(x)=40861613) +244 train 3.220031 (lr=2.0559e-04) (hash(x)=40462778) +245 train 3.230189 (lr=2.0643e-04) (hash(x)=41561116) +246 train 3.235812 (lr=2.0727e-04) (hash(x)=38815450) +247 train 3.262823 (lr=2.0811e-04) (hash(x)=31910694) +248 train 3.251402 (lr=2.0895e-04) (hash(x)=41167887) +249 train 3.283226 (lr=2.0979e-04) (hash(x)=35376527) +250 val loss 3.2163 +250 val perplexity 24.9362 +250 hella 0.2853 +250 train 3.251985 (lr=2.1063e-04) (hash(x)=35993491) +251 train 3.218689 (lr=2.1147e-04) (hash(x)=40660483) +252 train 3.200462 (lr=2.1231e-04) (hash(x)=37609395) +253 train 3.209288 (lr=2.1315e-04) (hash(x)=41181142) +254 train 3.213053 (lr=2.1399e-04) (hash(x)=35736560) +255 train 3.156324 (lr=2.1483e-04) (hash(x)=40724675) +256 train 3.176502 (lr=2.1566e-04) (hash(x)=38108232) +257 train 3.163134 (lr=2.1650e-04) (hash(x)=46313097) +258 train 3.231628 (lr=2.1734e-04) (hash(x)=39500175) +259 train 3.256361 (lr=2.1818e-04) (hash(x)=36741155) +260 train 3.189654 (lr=2.1902e-04) (hash(x)=37377326) +261 train 3.209828 (lr=2.1986e-04) (hash(x)=40879033) +262 train 3.214656 (lr=2.2070e-04) (hash(x)=41600523) +263 train 3.206513 (lr=2.2154e-04) (hash(x)=39594376) +264 train 3.192599 (lr=2.2238e-04) (hash(x)=41260157) +265 train 3.188475 (lr=2.2322e-04) (hash(x)=36377573) +266 train 3.167606 (lr=2.2406e-04) (hash(x)=41276740) +267 train 3.165098 (lr=2.2490e-04) (hash(x)=40220867) +268 train 3.247123 (lr=2.2573e-04) (hash(x)=38348548) +269 train 3.171829 (lr=2.2657e-04) (hash(x)=39225629) +270 train 3.232137 (lr=2.2741e-04) (hash(x)=39244397) +271 train 3.220442 (lr=2.2825e-04) (hash(x)=27385583) +272 train 3.190291 (lr=2.2909e-04) (hash(x)=39968102) +273 train 3.248634 (lr=2.2993e-04) (hash(x)=42465099) +274 train 3.229883 (lr=2.3077e-04) (hash(x)=43032093) +275 val loss 3.2169 +275 val perplexity 24.9503 +275 train 3.181202 (lr=2.3161e-04) (hash(x)=36597876) +276 train 3.284412 (lr=2.3245e-04) (hash(x)=40281752) +277 train 3.240707 (lr=2.3329e-04) (hash(x)=38343954) +278 train 3.280420 (lr=2.3413e-04) (hash(x)=43743130) +279 train 3.226279 (lr=2.3497e-04) (hash(x)=41388062) +280 train 3.244170 (lr=2.3580e-04) (hash(x)=40601760) +281 train 3.229652 (lr=2.3664e-04) (hash(x)=40388916) +282 train 3.257270 (lr=2.3748e-04) (hash(x)=33687560) +283 train 3.225372 (lr=2.3832e-04) (hash(x)=39924552) +284 train 3.310035 (lr=2.3916e-04) (hash(x)=42778901) +285 train 3.256431 (lr=2.4000e-04) (hash(x)=35148266) +286 train 3.192196 (lr=2.4084e-04) (hash(x)=46898906) +287 train 3.256575 (lr=2.4168e-04) (hash(x)=43768202) +288 train 3.216948 (lr=2.4252e-04) (hash(x)=34760716) +289 train 3.232610 (lr=2.4336e-04) (hash(x)=36379880) +290 train 3.254176 (lr=2.4420e-04) (hash(x)=38926815) +291 train 3.207439 (lr=2.4503e-04) (hash(x)=38752428) +292 train 3.205800 (lr=2.4587e-04) (hash(x)=41361646) +293 train 3.222862 (lr=2.4671e-04) (hash(x)=38054202) +294 train 3.217958 (lr=2.4755e-04) (hash(x)=39152755) +295 train 3.189409 (lr=2.4839e-04) (hash(x)=38357516) +296 train 3.186535 (lr=2.4923e-04) (hash(x)=40358075) +297 train 3.161336 (lr=2.5007e-04) (hash(x)=37312121) +298 train 3.227117 (lr=2.5091e-04) (hash(x)=38208240) +299 train 3.185762 (lr=2.5175e-04) (hash(x)=44166581) +300 val loss 3.2231 +300 val perplexity 25.1050 +300 train 3.230689 (lr=2.5259e-04) (hash(x)=36207463) +301 train 3.243681 (lr=2.5343e-04) (hash(x)=39314948) +302 train 3.248014 (lr=2.5427e-04) (hash(x)=45453384) +303 train 3.231873 (lr=2.5510e-04) (hash(x)=39892498) +304 train 3.245906 (lr=2.5594e-04) (hash(x)=43742971) +305 train 3.278923 (lr=2.5678e-04) (hash(x)=44244587) +306 train 3.225178 (lr=2.5762e-04) (hash(x)=43079665) +307 train 3.172477 (lr=2.5846e-04) (hash(x)=40828523) +308 train 3.215585 (lr=2.5930e-04) (hash(x)=48350120) +309 train 3.201304 (lr=2.6014e-04) (hash(x)=36814899) +310 train 3.254836 (lr=2.6098e-04) (hash(x)=41483667) +311 train 3.266809 (lr=2.6182e-04) (hash(x)=34943057) +312 train 3.310055 (lr=2.6266e-04) (hash(x)=42138343) +313 train 3.266549 (lr=2.6350e-04) (hash(x)=43042522) +314 train 3.299217 (lr=2.6434e-04) (hash(x)=44216200) +315 train 3.266652 (lr=2.6517e-04) (hash(x)=40404472) +316 train 3.278720 (lr=2.6601e-04) (hash(x)=38387871) +317 train 3.253120 (lr=2.6685e-04) (hash(x)=35370546) +318 train 3.257941 (lr=2.6769e-04) (hash(x)=43006298) +319 train 3.261929 (lr=2.6853e-04) (hash(x)=45103177) +320 train 3.280879 (lr=2.6937e-04) (hash(x)=43782093) +321 train 3.276434 (lr=2.7021e-04) (hash(x)=32874759) +322 train 3.236037 (lr=2.7105e-04) (hash(x)=42054371) +323 train 3.236205 (lr=2.7189e-04) (hash(x)=39429436) +324 train 3.276591 (lr=2.7273e-04) (hash(x)=37154970) +325 val loss 3.2256 +325 val perplexity 25.1680 +325 train 3.275380 (lr=2.7357e-04) (hash(x)=33537750) +326 train 3.237547 (lr=2.7441e-04) (hash(x)=44178457) +327 train 3.220344 (lr=2.7524e-04) (hash(x)=36044153) +328 train 3.251259 (lr=2.7608e-04) (hash(x)=41092165) +329 train 3.187704 (lr=2.7692e-04) (hash(x)=41459563) +330 train 3.252609 (lr=2.7776e-04) (hash(x)=54876733) +331 train 3.266204 (lr=2.7860e-04) (hash(x)=40597732) +332 train 3.265992 (lr=2.7944e-04) (hash(x)=42354810) +333 train 3.236773 (lr=2.8028e-04) (hash(x)=37439772) +334 train 3.266068 (lr=2.8112e-04) (hash(x)=38162048) +335 train 3.250945 (lr=2.8196e-04) (hash(x)=34847438) +336 train 3.208168 (lr=2.8280e-04) (hash(x)=36231770) +337 train 3.244793 (lr=2.8364e-04) (hash(x)=38866291) +338 train 3.226283 (lr=2.8448e-04) (hash(x)=37322941) +339 train 3.263640 (lr=2.8531e-04) (hash(x)=42629702) +340 train 3.218490 (lr=2.8615e-04) (hash(x)=39540180) +341 train 3.201584 (lr=2.8699e-04) (hash(x)=38683307) +342 train 3.189478 (lr=2.8783e-04) (hash(x)=38989220) +343 train 3.310941 (lr=2.8867e-04) (hash(x)=36725995) +344 train 3.249321 (lr=2.8951e-04) (hash(x)=38961210) +345 train 3.247175 (lr=2.9035e-04) (hash(x)=35271965) +346 train 3.225396 (lr=2.9119e-04) (hash(x)=48017493) +347 train 3.288209 (lr=2.9203e-04) (hash(x)=37927674) +348 train 3.225883 (lr=2.9287e-04) (hash(x)=41001564) +349 train 3.261631 (lr=2.9371e-04) (hash(x)=37683044) +350 val loss 3.2278 +350 val perplexity 25.2243 +350 train 3.276576 (lr=2.9455e-04) (hash(x)=41215123) +351 train 3.301016 (lr=2.9538e-04) (hash(x)=34767166) +352 train 3.256894 (lr=2.9622e-04) (hash(x)=40148811) +353 train 3.284310 (lr=2.9706e-04) (hash(x)=39932211) +354 train 3.238462 (lr=2.9790e-04) (hash(x)=37210485) +355 train 3.305850 (lr=2.9874e-04) (hash(x)=38585829) +356 train 3.278985 (lr=2.9958e-04) (hash(x)=45389632) +357 train 3.288383 (lr=3.0042e-04) (hash(x)=40826465) +358 train 3.232859 (lr=3.0126e-04) (hash(x)=41969443) +359 train 3.272092 (lr=3.0210e-04) (hash(x)=38278104) +360 train 3.268836 (lr=3.0294e-04) (hash(x)=37890168) +361 train 3.257813 (lr=3.0378e-04) (hash(x)=39802003) +362 train 3.190590 (lr=3.0462e-04) (hash(x)=34848764) +363 train 3.263285 (lr=3.0545e-04) (hash(x)=38798729) +364 train 3.217320 (lr=3.0629e-04) (hash(x)=29664956) +365 train 3.254126 (lr=3.0713e-04) (hash(x)=39546637) +366 train 3.302497 (lr=3.0797e-04) (hash(x)=40101833) +367 train 3.300212 (lr=3.0881e-04) (hash(x)=39886578) +368 train 3.211179 (lr=3.0965e-04) (hash(x)=38767570) +369 train 3.216907 (lr=3.1049e-04) (hash(x)=39475155) +370 train 3.209735 (lr=3.1133e-04) (hash(x)=39999281) +371 train 3.201679 (lr=3.1217e-04) (hash(x)=38911304) +372 train 3.249149 (lr=3.1301e-04) (hash(x)=39395614) +373 train 3.187395 (lr=3.1385e-04) (hash(x)=42311090) +374 train 3.237624 (lr=3.1469e-04) (hash(x)=38826699) +375 val loss 3.2373 +375 val perplexity 25.4637 +375 train 3.255544 (lr=3.1552e-04) (hash(x)=42876113) +376 train 3.267937 (lr=3.1636e-04) (hash(x)=37319948) +377 train 3.240422 (lr=3.1720e-04) (hash(x)=40796998) +378 train 3.322007 (lr=3.1804e-04) (hash(x)=37648208) +379 train 3.264425 (lr=3.1888e-04) (hash(x)=40023276) +380 train 3.200826 (lr=3.1972e-04) (hash(x)=41012662) +381 train 3.235671 (lr=3.2056e-04) (hash(x)=35353760) +382 train 3.232884 (lr=3.2140e-04) (hash(x)=37539108) +383 train 3.196033 (lr=3.2224e-04) (hash(x)=43169429) +384 train 3.251285 (lr=3.2308e-04) (hash(x)=34370950) +385 train 3.259008 (lr=3.2392e-04) (hash(x)=53251708) +386 train 3.293884 (lr=3.2476e-04) (hash(x)=43022970) +387 train 3.238677 (lr=3.2559e-04) (hash(x)=38948613) +388 train 3.228348 (lr=3.2643e-04) (hash(x)=32852975) +389 train 3.291195 (lr=3.2727e-04) (hash(x)=32549470) +390 train 3.234497 (lr=3.2811e-04) (hash(x)=36581623) +391 train 3.303847 (lr=3.2895e-04) (hash(x)=41095736) +392 train 3.266145 (lr=3.2979e-04) (hash(x)=35056803) +393 train 3.300159 (lr=3.3063e-04) (hash(x)=40006294) +394 train 3.265122 (lr=3.3147e-04) (hash(x)=40433910) +395 train 3.265574 (lr=3.3231e-04) (hash(x)=50077210) +396 train 3.269580 (lr=3.3315e-04) (hash(x)=37424726) +397 train 3.247319 (lr=3.3399e-04) (hash(x)=43514349) +398 train 3.247639 (lr=3.3483e-04) (hash(x)=35886098) +399 train 3.262782 (lr=3.3566e-04) (hash(x)=42960271) +400 val loss 3.2379 +400 val perplexity 25.4802 +400 train 3.258921 (lr=3.3650e-04) (hash(x)=37952826) +401 train 3.225997 (lr=3.3734e-04) (hash(x)=43892643) +402 train 3.211330 (lr=3.3818e-04) (hash(x)=36125569) +403 train 3.236471 (lr=3.3902e-04) (hash(x)=40102444) +404 train 3.229194 (lr=3.3986e-04) (hash(x)=41666406) +405 train 3.254796 (lr=3.4070e-04) (hash(x)=37459499) +406 train 3.173500 (lr=3.4154e-04) (hash(x)=44233924) +407 train 3.219419 (lr=3.4238e-04) (hash(x)=34666251) +408 train 3.259888 (lr=3.4322e-04) (hash(x)=46785085) +409 train 3.249492 (lr=3.4406e-04) (hash(x)=39473167) +410 train 3.262406 (lr=3.4490e-04) (hash(x)=37756807) +411 train 3.253291 (lr=3.4573e-04) (hash(x)=40685710) +412 train 3.234354 (lr=3.4657e-04) (hash(x)=51880970) +413 train 3.245161 (lr=3.4741e-04) (hash(x)=42678764) +414 train 3.241284 (lr=3.4825e-04) (hash(x)=39389558) +415 train 3.225661 (lr=3.4909e-04) (hash(x)=41466470) +416 train 3.287215 (lr=3.4993e-04) (hash(x)=44107557) +417 train 3.154819 (lr=3.5077e-04) (hash(x)=40649729) +418 train 3.221495 (lr=3.5161e-04) (hash(x)=27627663) +419 train 3.220423 (lr=3.5245e-04) (hash(x)=45276952) +420 train 3.249991 (lr=3.5329e-04) (hash(x)=40910703) +421 train 3.260306 (lr=3.5413e-04) (hash(x)=49131665) +422 train 3.286299 (lr=3.5497e-04) (hash(x)=44436967) +423 train 3.271866 (lr=3.5580e-04) (hash(x)=32187531) +424 train 3.231776 (lr=3.5664e-04) (hash(x)=36328281) +425 val loss 3.2511 +425 val perplexity 25.8175 +425 train 3.260003 (lr=3.5748e-04) (hash(x)=39041317) +426 train 3.274465 (lr=3.5832e-04) (hash(x)=44277248) +427 train 3.276428 (lr=3.5916e-04) (hash(x)=40066083) +428 train 3.314526 (lr=3.6000e-04) (hash(x)=41229570) +429 train 3.289736 (lr=3.6084e-04) (hash(x)=40445405) +430 train 3.346877 (lr=3.6168e-04) (hash(x)=41542299) +431 train 3.377554 (lr=3.6252e-04) (hash(x)=38698371) +432 train 3.361462 (lr=3.6336e-04) (hash(x)=35271695) +433 train 3.273361 (lr=3.6420e-04) (hash(x)=40905186) +434 train 3.261288 (lr=3.6503e-04) (hash(x)=43852277) +435 train 3.312571 (lr=3.6587e-04) (hash(x)=37995500) +436 train 3.326318 (lr=3.6671e-04) (hash(x)=45529988) +437 train 3.240896 (lr=3.6755e-04) (hash(x)=34043394) +438 train 3.246916 (lr=3.6839e-04) (hash(x)=41998697) +439 train 3.274296 (lr=3.6923e-04) (hash(x)=42996801) +440 train 3.278425 (lr=3.7007e-04) (hash(x)=38844602) +441 train 3.269735 (lr=3.7091e-04) (hash(x)=43567259) +442 train 3.276216 (lr=3.7175e-04) (hash(x)=38050262) +443 train 3.262886 (lr=3.7259e-04) (hash(x)=37444312) +444 train 3.244430 (lr=3.7343e-04) (hash(x)=40458175) +445 train 3.209620 (lr=3.7427e-04) (hash(x)=42938488) +446 train 3.279008 (lr=3.7510e-04) (hash(x)=38068128) +447 train 3.252793 (lr=3.7594e-04) (hash(x)=42954147) +448 train 3.327836 (lr=3.7678e-04) (hash(x)=40997142) +449 train 3.238181 (lr=3.7762e-04) (hash(x)=41949838) +450 val loss 3.2536 +450 val perplexity 25.8825 +450 train 3.400932 (lr=3.7846e-04) (hash(x)=46442168) +451 train 3.251357 (lr=3.7930e-04) (hash(x)=41193513) +452 train 3.223974 (lr=3.8014e-04) (hash(x)=42094359) +453 train 3.308260 (lr=3.8098e-04) (hash(x)=40224693) +454 train 3.322552 (lr=3.8182e-04) (hash(x)=40694172) +455 train 3.211985 (lr=3.8266e-04) (hash(x)=43849034) +456 train 3.290156 (lr=3.8350e-04) (hash(x)=43031818) +457 train 3.205769 (lr=3.8434e-04) (hash(x)=42648027) +458 train 3.318455 (lr=3.8517e-04) (hash(x)=41324822) +459 train 3.314360 (lr=3.8601e-04) (hash(x)=43615204) +460 train 3.246157 (lr=3.8685e-04) (hash(x)=42166024) +461 train 3.241877 (lr=3.8769e-04) (hash(x)=38679759) +462 train 3.255769 (lr=3.8853e-04) (hash(x)=34957253) +463 train 3.278873 (lr=3.8937e-04) (hash(x)=37168942) +464 train 3.324345 (lr=3.9021e-04) (hash(x)=36040623) +465 train 3.280344 (lr=3.9105e-04) (hash(x)=39944386) +466 train 3.267062 (lr=3.9189e-04) (hash(x)=40045771) +467 train 3.249286 (lr=3.9273e-04) (hash(x)=44407115) +468 train 3.297253 (lr=3.9357e-04) (hash(x)=44484426) +469 train 3.257634 (lr=3.9441e-04) (hash(x)=40789214) +470 train 3.269072 (lr=3.9524e-04) (hash(x)=39432959) +471 train 3.218879 (lr=3.9608e-04) (hash(x)=38648345) +472 train 3.291209 (lr=3.9692e-04) (hash(x)=41878775) +473 train 3.306014 (lr=3.9776e-04) (hash(x)=37828171) +474 train 3.279881 (lr=3.9860e-04) (hash(x)=42773508) +475 val loss 3.2521 +475 val perplexity 25.8436 +475 train 3.229876 (lr=3.9944e-04) (hash(x)=42981879) +476 train 3.229131 (lr=4.0028e-04) (hash(x)=39526595) +477 train 3.259519 (lr=4.0112e-04) (hash(x)=44116937) +478 train 3.244689 (lr=4.0196e-04) (hash(x)=43641905) +479 train 3.226527 (lr=4.0280e-04) (hash(x)=42470607) +480 train 3.222528 (lr=4.0364e-04) (hash(x)=38703129) +481 train 3.287268 (lr=4.0448e-04) (hash(x)=38442042) +482 train 3.257579 (lr=4.0531e-04) (hash(x)=37327148) +483 train 3.288312 (lr=4.0615e-04) (hash(x)=42418663) +484 train 3.256192 (lr=4.0699e-04) (hash(x)=40735368) +485 train 3.237785 (lr=4.0783e-04) (hash(x)=48465047) +486 train 3.249147 (lr=4.0867e-04) (hash(x)=34954901) +487 train 3.276341 (lr=4.0951e-04) (hash(x)=40681768) +488 train 3.300718 (lr=4.1035e-04) (hash(x)=37742200) +489 train 3.266953 (lr=4.1119e-04) (hash(x)=39088579) +490 train 3.272052 (lr=4.1203e-04) (hash(x)=39913142) +491 train 3.295114 (lr=4.1287e-04) (hash(x)=36971052) +492 train 3.293194 (lr=4.1371e-04) (hash(x)=35949497) +493 train 3.285457 (lr=4.1455e-04) (hash(x)=39550642) +494 train 3.330901 (lr=4.1538e-04) (hash(x)=48741738) +495 train 3.216320 (lr=4.1622e-04) (hash(x)=39586059) +496 train 3.307419 (lr=4.1706e-04) (hash(x)=42632671) +497 train 3.241969 (lr=4.1790e-04) (hash(x)=40622843) +498 train 3.261941 (lr=4.1874e-04) (hash(x)=40265835) +499 train 3.328933 (lr=4.1958e-04) (hash(x)=44697460) +500 val loss 3.2572 +500 val perplexity 25.9770 +500 hella 0.2840 +500 train 3.318066 (lr=4.2042e-04) (hash(x)=30483869) +501 train 3.291111 (lr=4.2126e-04) (hash(x)=42169061) +502 train 3.245790 (lr=4.2210e-04) (hash(x)=41684737) +503 train 3.236382 (lr=4.2294e-04) (hash(x)=38235292) +504 train 3.318565 (lr=4.2378e-04) (hash(x)=36158582) +505 train 3.346879 (lr=4.2462e-04) (hash(x)=40754658) +506 train 3.276640 (lr=4.2545e-04) (hash(x)=43182360) +507 train 3.238719 (lr=4.2629e-04) (hash(x)=39572352) +508 train 3.308569 (lr=4.2713e-04) (hash(x)=36969797) +509 train 3.330495 (lr=4.2797e-04) (hash(x)=40058482) +510 train 3.246832 (lr=4.2881e-04) (hash(x)=35740449) +511 train 3.229458 (lr=4.2965e-04) (hash(x)=27670931) +512 train 3.211760 (lr=4.3049e-04) (hash(x)=35150740) +513 train 3.270516 (lr=4.3133e-04) (hash(x)=35016917) +514 train 3.249013 (lr=4.3217e-04) (hash(x)=38682756) +515 train 3.272719 (lr=4.3301e-04) (hash(x)=39106562) +516 train 3.358249 (lr=4.3385e-04) (hash(x)=39428603) +517 train 3.332795 (lr=4.3469e-04) (hash(x)=42612112) +518 train 3.309698 (lr=4.3552e-04) (hash(x)=39441406) +519 train 3.223217 (lr=4.3636e-04) (hash(x)=34709583) +520 train 3.207419 (lr=4.3720e-04) (hash(x)=39562317) +521 train 3.299530 (lr=4.3804e-04) (hash(x)=39583758) +522 train 3.308862 (lr=4.3888e-04) (hash(x)=44874234) +523 train 3.333098 (lr=4.3972e-04) (hash(x)=38391012) +524 train 3.374120 (lr=4.4056e-04) (hash(x)=44985871) +525 val loss 3.2696 +525 val perplexity 26.3001 +525 train 3.322748 (lr=4.4140e-04) (hash(x)=41831592) +526 train 3.313788 (lr=4.4224e-04) (hash(x)=44214015) +527 train 3.303121 (lr=4.4308e-04) (hash(x)=38458588) +528 train 3.243906 (lr=4.4392e-04) (hash(x)=34893332) +529 train 3.270003 (lr=4.4476e-04) (hash(x)=34547329) +530 train 3.321211 (lr=4.4559e-04) (hash(x)=42863637) +531 train 3.270474 (lr=4.4643e-04) (hash(x)=37059451) +532 train 3.281693 (lr=4.4727e-04) (hash(x)=42751953) +533 train 3.256982 (lr=4.4811e-04) (hash(x)=45020382) +534 train 3.309428 (lr=4.4895e-04) (hash(x)=45022326) +535 train 3.373766 (lr=4.4979e-04) (hash(x)=40098059) +536 train 3.321029 (lr=4.5063e-04) (hash(x)=39151557) +537 train 3.268144 (lr=4.5147e-04) (hash(x)=42315898) +538 train 3.291312 (lr=4.5231e-04) (hash(x)=43793759) +539 train 3.346560 (lr=4.5315e-04) (hash(x)=36061233) +540 train 3.278664 (lr=4.5399e-04) (hash(x)=40459859) +541 train 3.289929 (lr=4.5483e-04) (hash(x)=45919037) +542 train 3.308162 (lr=4.5566e-04) (hash(x)=38338965) +543 train 3.269930 (lr=4.5650e-04) (hash(x)=38884260) +544 train 3.272179 (lr=4.5734e-04) (hash(x)=37265988) +545 train 3.342009 (lr=4.5818e-04) (hash(x)=41942323) +546 train 3.348345 (lr=4.5902e-04) (hash(x)=41835453) +547 train 3.289212 (lr=4.5986e-04) (hash(x)=40584244) +548 train 3.256776 (lr=4.6070e-04) (hash(x)=37195679) +549 train 3.281730 (lr=4.6154e-04) (hash(x)=40858497) +550 val loss 3.2696 +550 val perplexity 26.3021 +550 train 3.288745 (lr=4.6238e-04) (hash(x)=42139122) +551 train 3.279516 (lr=4.6322e-04) (hash(x)=39953271) +552 train 3.238705 (lr=4.6406e-04) (hash(x)=44119297) +553 train 3.270301 (lr=4.6490e-04) (hash(x)=53072781) +554 train 3.271532 (lr=4.6573e-04) (hash(x)=36810184) +555 train 3.262812 (lr=4.6657e-04) (hash(x)=40857238) +556 train 3.293499 (lr=4.6741e-04) (hash(x)=41336790) +557 train 3.256098 (lr=4.6825e-04) (hash(x)=44111018) +558 train 3.246073 (lr=4.6909e-04) (hash(x)=38075206) +559 train 3.246317 (lr=4.6993e-04) (hash(x)=40911304) +560 train 3.296389 (lr=4.7077e-04) (hash(x)=37405237) +561 train 3.295834 (lr=4.7161e-04) (hash(x)=41471451) +562 train 3.374693 (lr=4.7245e-04) (hash(x)=31096571) +563 train 3.323635 (lr=4.7329e-04) (hash(x)=38458753) +564 train 3.279131 (lr=4.7413e-04) (hash(x)=38188773) +565 train 3.278409 (lr=4.7497e-04) (hash(x)=37424927) +566 train 3.288112 (lr=4.7580e-04) (hash(x)=43214465) +567 train 3.300266 (lr=4.7664e-04) (hash(x)=37286236) +568 train 3.316252 (lr=4.7748e-04) (hash(x)=38315861) +569 train 3.296781 (lr=4.7832e-04) (hash(x)=47418732) +570 train 3.378994 (lr=4.7916e-04) (hash(x)=43721721) +571 train 3.265891 (lr=4.8000e-04) (hash(x)=42444603) +572 train 3.396063 (lr=4.8084e-04) (hash(x)=43075348) +573 train 3.317782 (lr=4.8168e-04) (hash(x)=43481237) +574 train 3.279052 (lr=4.8252e-04) (hash(x)=41688432) +575 val loss 3.2764 +575 val perplexity 26.4805 +575 train 3.396676 (lr=4.8336e-04) (hash(x)=36657433) +576 train 3.324876 (lr=4.8420e-04) (hash(x)=40373772) +577 train 3.263401 (lr=4.8503e-04) (hash(x)=41906797) +578 train 3.343299 (lr=4.8587e-04) (hash(x)=38023259) +579 train 3.256950 (lr=4.8671e-04) (hash(x)=42489581) +580 train 3.374172 (lr=4.8755e-04) (hash(x)=40972706) +581 train 3.328948 (lr=4.8839e-04) (hash(x)=39010938) +582 train 3.344221 (lr=4.8923e-04) (hash(x)=36787319) +583 train 3.323186 (lr=4.9007e-04) (hash(x)=37207799) +584 train 3.286663 (lr=4.9091e-04) (hash(x)=34781806) +585 train 3.286661 (lr=4.9175e-04) (hash(x)=40812060) +586 train 3.291377 (lr=4.9259e-04) (hash(x)=39626954) +587 train 3.321775 (lr=4.9343e-04) (hash(x)=43983725) +588 train 3.266236 (lr=4.9427e-04) (hash(x)=35035541) +589 train 3.242346 (lr=4.9510e-04) (hash(x)=39042350) +590 train 3.361746 (lr=4.9594e-04) (hash(x)=38975166) +591 train 3.243824 (lr=4.9678e-04) (hash(x)=37293608) +592 train 3.235366 (lr=4.9762e-04) (hash(x)=44391666) +593 train 3.281267 (lr=4.9846e-04) (hash(x)=38196886) +594 train 3.304746 (lr=4.9930e-04) (hash(x)=41324953) +595 train 3.312991 (lr=5.0014e-04) (hash(x)=39631132) +596 train 3.335827 (lr=5.0098e-04) (hash(x)=38412600) +597 train 3.252549 (lr=5.0182e-04) (hash(x)=43423466) +598 train 3.316258 (lr=5.0266e-04) (hash(x)=40272757) +599 train 3.318518 (lr=5.0350e-04) (hash(x)=43378227) +600 val loss 3.2799 +600 val perplexity 26.5740 +600 train 3.303079 (lr=5.0434e-04) (hash(x)=39984095) +601 train 3.273619 (lr=5.0517e-04) (hash(x)=29648373) +602 train 3.316287 (lr=5.0601e-04) (hash(x)=42683949) +603 train 3.289851 (lr=5.0685e-04) (hash(x)=43930731) +604 train 3.255086 (lr=5.0769e-04) (hash(x)=46096356) +605 train 3.364946 (lr=5.0853e-04) (hash(x)=37091783) +606 train 3.263491 (lr=5.0937e-04) (hash(x)=38148466) +607 train 3.315711 (lr=5.1021e-04) (hash(x)=43291875) +608 train 3.266280 (lr=5.1105e-04) (hash(x)=36008196) +609 train 3.339887 (lr=5.1189e-04) (hash(x)=49633954) +610 train 3.326223 (lr=5.1273e-04) (hash(x)=37921385) +611 train 3.338983 (lr=5.1357e-04) (hash(x)=37263142) +612 train 3.414657 (lr=5.1441e-04) (hash(x)=40488619) +613 train 3.324513 (lr=5.1524e-04) (hash(x)=42151010) +614 train 3.264045 (lr=5.1608e-04) (hash(x)=42966895) +615 train 3.285918 (lr=5.1692e-04) (hash(x)=40782716) +616 train 3.304768 (lr=5.1776e-04) (hash(x)=43818385) +617 train 3.329885 (lr=5.1860e-04) (hash(x)=37230748) +618 train 3.309114 (lr=5.1944e-04) (hash(x)=43000696) +619 train 3.391006 (lr=5.2028e-04) (hash(x)=40255431) +620 train 3.337078 (lr=5.2112e-04) (hash(x)=39193758) +621 train 3.273063 (lr=5.2196e-04) (hash(x)=41800741) +622 train 3.313095 (lr=5.2280e-04) (hash(x)=37653367) +623 train 3.328111 (lr=5.2364e-04) (hash(x)=41930421) +624 train 3.289440 (lr=5.2448e-04) (hash(x)=41355454) +625 val loss 3.2848 +625 val perplexity 26.7032 +625 train 3.244143 (lr=5.2531e-04) (hash(x)=48087904) +626 train 3.262414 (lr=5.2615e-04) (hash(x)=41553046) +627 train 3.284008 (lr=5.2699e-04) (hash(x)=40352059) +628 train 3.292843 (lr=5.2783e-04) (hash(x)=38856977) +629 train 3.222003 (lr=5.2867e-04) (hash(x)=43128805) +630 train 3.308345 (lr=5.2951e-04) (hash(x)=37250136) +631 train 3.340319 (lr=5.3035e-04) (hash(x)=39777756) +632 train 3.234882 (lr=5.3119e-04) (hash(x)=36305357) +633 train 3.292531 (lr=5.3203e-04) (hash(x)=39367198) +634 train 3.280626 (lr=5.3287e-04) (hash(x)=40242582) +635 train 3.358690 (lr=5.3371e-04) (hash(x)=42464122) +636 train 3.330877 (lr=5.3455e-04) (hash(x)=41510997) +637 train 3.303590 (lr=5.3538e-04) (hash(x)=35862943) +638 train 3.320675 (lr=5.3622e-04) (hash(x)=46620072) +639 train 3.389352 (lr=5.3706e-04) (hash(x)=39831528) +640 train 3.383523 (lr=5.3790e-04) (hash(x)=43031187) +641 train 3.338926 (lr=5.3874e-04) (hash(x)=43340475) +642 train 3.301379 (lr=5.3958e-04) (hash(x)=43411475) +643 train 3.251754 (lr=5.4042e-04) (hash(x)=36793170) +644 train 3.325233 (lr=5.4126e-04) (hash(x)=38691938) +645 train 3.293574 (lr=5.4210e-04) (hash(x)=42864915) +646 train 3.304761 (lr=5.4294e-04) (hash(x)=40546833) +647 train 3.317239 (lr=5.4378e-04) (hash(x)=38515240) +648 train 3.318382 (lr=5.4462e-04) (hash(x)=39233131) +649 train 3.338044 (lr=5.4545e-04) (hash(x)=49840445) +650 val loss 3.2890 +650 val perplexity 26.8148 +650 train 3.310285 (lr=5.4629e-04) (hash(x)=56645602) +651 train 3.408989 (lr=5.4713e-04) (hash(x)=37992784) +652 train 3.336506 (lr=5.4797e-04) (hash(x)=34059789) +653 train 3.308382 (lr=5.4881e-04) (hash(x)=40402037) +654 train 3.375352 (lr=5.4965e-04) (hash(x)=38072809) +655 train 3.311672 (lr=5.5049e-04) (hash(x)=40113736) +656 train 3.311733 (lr=5.5133e-04) (hash(x)=43215171) +657 train 3.348651 (lr=5.5217e-04) (hash(x)=41836965) +658 train 3.340961 (lr=5.5301e-04) (hash(x)=35783759) +659 train 3.314900 (lr=5.5385e-04) (hash(x)=41732323) +660 train 3.268070 (lr=5.5469e-04) (hash(x)=38153008) +661 train 3.273662 (lr=5.5552e-04) (hash(x)=44736389) +662 train 3.292401 (lr=5.5636e-04) (hash(x)=29938060) +663 train 3.243684 (lr=5.5720e-04) (hash(x)=44715934) +664 train 3.344959 (lr=5.5804e-04) (hash(x)=45226902) +665 train 3.286958 (lr=5.5888e-04) (hash(x)=35871559) +666 train 3.295585 (lr=5.5972e-04) (hash(x)=39766299) +667 train 3.351629 (lr=5.6056e-04) (hash(x)=40065060) +668 train 3.278718 (lr=5.6140e-04) (hash(x)=35628651) +669 train 3.371896 (lr=5.6224e-04) (hash(x)=32456750) +670 train 3.359426 (lr=5.6308e-04) (hash(x)=41364659) +671 train 3.357903 (lr=5.6392e-04) (hash(x)=40262234) +672 train 3.383301 (lr=5.6476e-04) (hash(x)=39588447) +673 train 3.360382 (lr=5.6559e-04) (hash(x)=43807485) +674 train 3.316695 (lr=5.6643e-04) (hash(x)=39713061) +675 val loss 3.2951 +675 val perplexity 26.9791 +675 train 3.292665 (lr=5.6727e-04) (hash(x)=37130235) +676 train 3.346793 (lr=5.6811e-04) (hash(x)=44225881) +677 train 3.418056 (lr=5.6895e-04) (hash(x)=40877864) +678 train 3.329269 (lr=5.6979e-04) (hash(x)=42780856) +679 train 3.285942 (lr=5.7063e-04) (hash(x)=39012554) +680 train 3.315508 (lr=5.7147e-04) (hash(x)=49042245) +681 train 3.307147 (lr=5.7231e-04) (hash(x)=38931901) +682 train 3.291947 (lr=5.7315e-04) (hash(x)=43435357) +683 train 3.319344 (lr=5.7399e-04) (hash(x)=41565218) +684 train 3.362681 (lr=5.7483e-04) (hash(x)=36311728) +685 train 3.373999 (lr=5.7566e-04) (hash(x)=39603093) +686 train 3.335708 (lr=5.7650e-04) (hash(x)=37376512) +687 train 3.358831 (lr=5.7734e-04) (hash(x)=41976781) +688 train 3.305523 (lr=5.7818e-04) (hash(x)=40946340) +689 train 3.307913 (lr=5.7902e-04) (hash(x)=38994999) +690 train 3.364226 (lr=5.7986e-04) (hash(x)=37981861) +691 train 3.302724 (lr=5.8070e-04) (hash(x)=39694781) +692 train 3.366254 (lr=5.8154e-04) (hash(x)=42403643) +693 train 3.387747 (lr=5.8238e-04) (hash(x)=44475934) +694 train 3.287847 (lr=5.8322e-04) (hash(x)=39772877) +695 train 3.346834 (lr=5.8406e-04) (hash(x)=39045113) +696 train 3.281369 (lr=5.8490e-04) (hash(x)=40840908) +697 train 3.306516 (lr=5.8573e-04) (hash(x)=36269126) +698 train 3.343663 (lr=5.8657e-04) (hash(x)=33591977) +699 train 3.268478 (lr=5.8741e-04) (hash(x)=44552747) +700 val loss 3.2985 +700 val perplexity 27.0708 +700 train 3.347619 (lr=5.8825e-04) (hash(x)=40225050) +701 train 3.281080 (lr=5.8909e-04) (hash(x)=39782847) +702 train 3.283315 (lr=5.8993e-04) (hash(x)=38550708) +703 train 3.240273 (lr=5.9077e-04) (hash(x)=38852745) +704 train 3.310759 (lr=5.9161e-04) (hash(x)=48676800) +705 train 3.334638 (lr=5.9245e-04) (hash(x)=37916409) +706 train 3.307055 (lr=5.9329e-04) (hash(x)=37766140) +707 train 3.284875 (lr=5.9413e-04) (hash(x)=43458512) +708 train 3.311787 (lr=5.9497e-04) (hash(x)=38571055) +709 train 3.349421 (lr=5.9580e-04) (hash(x)=41352945) +710 train 3.295010 (lr=5.9664e-04) (hash(x)=40578200) +711 train 3.310658 (lr=5.9748e-04) (hash(x)=37848579) +712 train 3.355964 (lr=5.9832e-04) (hash(x)=38873773) +713 train 3.288124 (lr=5.9916e-04) (hash(x)=37655437) +714 train 3.288500 (lr=6.0000e-04) (hash(x)=40063950) +715 train 3.359801 (lr=6.0000e-04) (hash(x)=35322850) +716 train 3.432407 (lr=6.0000e-04) (hash(x)=43236859) +717 train 3.432174 (lr=6.0000e-04) (hash(x)=37300290) +718 train 3.344039 (lr=6.0000e-04) (hash(x)=39020214) +719 train 3.400637 (lr=5.9999e-04) (hash(x)=42318881) +720 train 3.377214 (lr=5.9999e-04) (hash(x)=45029979) +721 train 3.334618 (lr=5.9998e-04) (hash(x)=45907686) +722 train 3.270325 (lr=5.9998e-04) (hash(x)=39078453) +723 train 3.375270 (lr=5.9997e-04) (hash(x)=39610966) +724 train 3.325827 (lr=5.9997e-04) (hash(x)=39368256) +725 val loss 3.3006 +725 val perplexity 27.1289 +725 train 3.320276 (lr=5.9996e-04) (hash(x)=43256701) +726 train 3.399893 (lr=5.9995e-04) (hash(x)=69566261) +727 train 3.350579 (lr=5.9994e-04) (hash(x)=39594567) +728 train 3.329896 (lr=5.9993e-04) (hash(x)=37766083) +729 train 3.361276 (lr=5.9992e-04) (hash(x)=36765282) +730 train 3.333490 (lr=5.9991e-04) (hash(x)=42186978) +731 train 3.396247 (lr=5.9989e-04) (hash(x)=23819865) +732 train 3.346505 (lr=5.9988e-04) (hash(x)=39777738) +733 train 3.271148 (lr=5.9986e-04) (hash(x)=37054409) +734 train 3.328517 (lr=5.9985e-04) (hash(x)=36194778) +735 train 3.305109 (lr=5.9983e-04) (hash(x)=40423147) +736 train 3.305711 (lr=5.9982e-04) (hash(x)=42517385) +737 train 3.353032 (lr=5.9980e-04) (hash(x)=47849113) +738 train 3.408038 (lr=5.9978e-04) (hash(x)=41956330) +739 train 3.276037 (lr=5.9976e-04) (hash(x)=44653805) +740 train 3.315097 (lr=5.9974e-04) (hash(x)=41607922) +741 train 3.276075 (lr=5.9972e-04) (hash(x)=38915126) +742 train 3.353289 (lr=5.9970e-04) (hash(x)=37530631) +743 train 3.263848 (lr=5.9967e-04) (hash(x)=37394124) +744 train 3.420861 (lr=5.9965e-04) (hash(x)=39918010) +745 train 3.287963 (lr=5.9962e-04) (hash(x)=38288818) +746 train 3.277514 (lr=5.9960e-04) (hash(x)=42158008) +747 train 3.281941 (lr=5.9957e-04) (hash(x)=39150796) +748 train 3.275072 (lr=5.9954e-04) (hash(x)=37363642) +749 train 3.313231 (lr=5.9952e-04) (hash(x)=40921015) +750 val loss 3.3024 +750 val perplexity 27.1771 +750 hella 0.2820 +750 train 3.297691 (lr=5.9949e-04) (hash(x)=45108714) +751 train 3.264790 (lr=5.9946e-04) (hash(x)=40502641) +752 train 3.280670 (lr=5.9943e-04) (hash(x)=34229600) +753 train 3.333694 (lr=5.9940e-04) (hash(x)=45270783) +754 train 3.307635 (lr=5.9936e-04) (hash(x)=47657850) +755 train 3.313584 (lr=5.9933e-04) (hash(x)=41611307) +756 train 3.310146 (lr=5.9930e-04) (hash(x)=40586604) +757 train 3.354365 (lr=5.9926e-04) (hash(x)=37068219) +758 train 3.345196 (lr=5.9923e-04) (hash(x)=49808077) +759 train 3.361019 (lr=5.9919e-04) (hash(x)=42570262) +760 train 3.345048 (lr=5.9915e-04) (hash(x)=36327528) +761 train 3.417598 (lr=5.9912e-04) (hash(x)=42311189) +762 train 3.358256 (lr=5.9908e-04) (hash(x)=41529683) +763 train 3.358593 (lr=5.9904e-04) (hash(x)=37092098) +764 train 3.369166 (lr=5.9900e-04) (hash(x)=37470292) +765 train 3.471427 (lr=5.9896e-04) (hash(x)=38619461) +766 train 3.312889 (lr=5.9891e-04) (hash(x)=37642328) +767 train 3.315664 (lr=5.9887e-04) (hash(x)=37894743) +768 train 3.289246 (lr=5.9883e-04) (hash(x)=37406252) +769 train 3.294086 (lr=5.9878e-04) (hash(x)=52475395) +770 train 3.318250 (lr=5.9874e-04) (hash(x)=38604350) +771 train 3.395555 (lr=5.9869e-04) (hash(x)=42701789) +772 train 3.337803 (lr=5.9864e-04) (hash(x)=32858945) +773 train 3.359527 (lr=5.9859e-04) (hash(x)=37075744) +774 train 3.352750 (lr=5.9855e-04) (hash(x)=38462866) +775 val loss 3.3130 +775 val perplexity 27.4680 +775 train 3.292016 (lr=5.9850e-04) (hash(x)=38559624) +776 train 3.301734 (lr=5.9845e-04) (hash(x)=44091922) +777 train 3.394579 (lr=5.9839e-04) (hash(x)=38145601) +778 train 3.364999 (lr=5.9834e-04) (hash(x)=39474846) +779 train 3.314486 (lr=5.9829e-04) (hash(x)=40349195) +780 train 3.273721 (lr=5.9824e-04) (hash(x)=43229796) +781 train 3.333047 (lr=5.9818e-04) (hash(x)=44067943) +782 train 3.336271 (lr=5.9812e-04) (hash(x)=37468690) +783 train 3.344418 (lr=5.9807e-04) (hash(x)=40373355) +784 train 3.332223 (lr=5.9801e-04) (hash(x)=49714714) +785 train 3.337447 (lr=5.9795e-04) (hash(x)=38895371) +786 train 3.335134 (lr=5.9789e-04) (hash(x)=45506962) +787 train 3.324823 (lr=5.9784e-04) (hash(x)=44620551) +788 train 3.352851 (lr=5.9777e-04) (hash(x)=40339708) +789 train 3.292516 (lr=5.9771e-04) (hash(x)=38767294) +790 train 3.317325 (lr=5.9765e-04) (hash(x)=39631038) +791 train 3.304017 (lr=5.9759e-04) (hash(x)=38496894) +792 train 3.328069 (lr=5.9752e-04) (hash(x)=41606627) +793 train 3.392493 (lr=5.9746e-04) (hash(x)=37598835) +794 train 3.351565 (lr=5.9739e-04) (hash(x)=35765947) +795 train 3.370168 (lr=5.9733e-04) (hash(x)=35218744) +796 train 3.270530 (lr=5.9726e-04) (hash(x)=38277599) +797 train 3.306581 (lr=5.9719e-04) (hash(x)=42823327) +798 train 3.350179 (lr=5.9712e-04) (hash(x)=41700831) +799 train 3.315153 (lr=5.9705e-04) (hash(x)=39347280) +800 val loss 3.3054 +800 val perplexity 27.2583 +800 train 3.342799 (lr=5.9698e-04) (hash(x)=39653582) +801 train 3.321471 (lr=5.9691e-04) (hash(x)=41586935) +802 train 3.350344 (lr=5.9684e-04) (hash(x)=40615613) +803 train 3.382905 (lr=5.9677e-04) (hash(x)=33663383) +804 train 3.311943 (lr=5.9669e-04) (hash(x)=42168942) +805 train 3.271276 (lr=5.9662e-04) (hash(x)=39934888) +806 train 3.324009 (lr=5.9654e-04) (hash(x)=36449311) +807 train 3.358610 (lr=5.9647e-04) (hash(x)=40138292) +808 train 3.323452 (lr=5.9639e-04) (hash(x)=38653513) +809 train 3.294690 (lr=5.9631e-04) (hash(x)=40334705) +810 train 3.301781 (lr=5.9623e-04) (hash(x)=47530436) +811 train 3.291191 (lr=5.9616e-04) (hash(x)=40259973) +812 train 3.318787 (lr=5.9607e-04) (hash(x)=40879958) +813 train 3.319958 (lr=5.9599e-04) (hash(x)=37835111) +814 train 3.350449 (lr=5.9591e-04) (hash(x)=46068395) +815 train 3.278173 (lr=5.9583e-04) (hash(x)=40782273) +816 train 3.309933 (lr=5.9575e-04) (hash(x)=37184299) +817 train 3.358669 (lr=5.9566e-04) (hash(x)=34932063) +818 train 3.374641 (lr=5.9558e-04) (hash(x)=42632017) +819 train 3.268628 (lr=5.9549e-04) (hash(x)=38585352) +820 train 3.287426 (lr=5.9540e-04) (hash(x)=36627253) +821 train 3.323379 (lr=5.9532e-04) (hash(x)=39629854) +822 train 3.319829 (lr=5.9523e-04) (hash(x)=37619856) +823 train 3.293731 (lr=5.9514e-04) (hash(x)=40931236) +824 train 3.351607 (lr=5.9505e-04) (hash(x)=32774956) +825 val loss 3.3064 +825 val perplexity 27.2854 +825 train 3.302734 (lr=5.9496e-04) (hash(x)=39240156) +826 train 3.378056 (lr=5.9486e-04) (hash(x)=43593249) +827 train 3.340452 (lr=5.9477e-04) (hash(x)=41343081) +828 train 3.300323 (lr=5.9468e-04) (hash(x)=41007316) +829 train 3.365509 (lr=5.9458e-04) (hash(x)=43183490) +830 train 3.307930 (lr=5.9449e-04) (hash(x)=38341342) +831 train 3.368065 (lr=5.9439e-04) (hash(x)=38488825) +832 train 3.298906 (lr=5.9430e-04) (hash(x)=38005712) +833 train 3.331005 (lr=5.9420e-04) (hash(x)=38813064) +834 train 3.315803 (lr=5.9410e-04) (hash(x)=41832942) +835 train 3.349760 (lr=5.9400e-04) (hash(x)=40098400) +836 train 3.290140 (lr=5.9390e-04) (hash(x)=47241699) +837 train 3.422352 (lr=5.9380e-04) (hash(x)=35577065) +838 train 3.294747 (lr=5.9370e-04) (hash(x)=41039694) +839 train 3.367740 (lr=5.9360e-04) (hash(x)=37499519) +840 train 3.295970 (lr=5.9349e-04) (hash(x)=37605077) +841 train 3.323065 (lr=5.9339e-04) (hash(x)=33078676) +842 train 3.314281 (lr=5.9328e-04) (hash(x)=37792946) +843 train 3.329109 (lr=5.9318e-04) (hash(x)=35393448) +844 train 3.297678 (lr=5.9307e-04) (hash(x)=36139333) +845 train 3.312480 (lr=5.9296e-04) (hash(x)=34003628) +846 train 3.424620 (lr=5.9286e-04) (hash(x)=42236468) +847 train 3.261665 (lr=5.9275e-04) (hash(x)=37695501) +848 train 3.299239 (lr=5.9264e-04) (hash(x)=34985499) +849 train 3.276549 (lr=5.9253e-04) (hash(x)=38722597) +850 val loss 3.3074 +850 val perplexity 27.3144 +850 train 3.308583 (lr=5.9241e-04) (hash(x)=38925573) +851 train 3.282915 (lr=5.9230e-04) (hash(x)=40978553) +852 train 3.270549 (lr=5.9219e-04) (hash(x)=41071151) +853 train 3.354008 (lr=5.9208e-04) (hash(x)=41346359) +854 train 3.350556 (lr=5.9196e-04) (hash(x)=43103331) +855 train 3.255393 (lr=5.9185e-04) (hash(x)=39993348) +856 train 3.366497 (lr=5.9173e-04) (hash(x)=43350849) +857 train 3.341176 (lr=5.9161e-04) (hash(x)=40131133) +858 train 3.315848 (lr=5.9149e-04) (hash(x)=47427051) +859 train 3.308410 (lr=5.9138e-04) (hash(x)=38516664) +860 train 3.341880 (lr=5.9126e-04) (hash(x)=37065178) +861 train 3.279750 (lr=5.9114e-04) (hash(x)=38385195) +862 train 3.316788 (lr=5.9101e-04) (hash(x)=41132568) +863 train 3.338404 (lr=5.9089e-04) (hash(x)=45852405) +864 train 3.379773 (lr=5.9077e-04) (hash(x)=46142957) +865 train 3.300624 (lr=5.9065e-04) (hash(x)=37674315) +866 train 3.370498 (lr=5.9052e-04) (hash(x)=40551807) +867 train 3.431355 (lr=5.9040e-04) (hash(x)=35428929) +868 train 3.339293 (lr=5.9027e-04) (hash(x)=39900258) +869 train 3.359302 (lr=5.9014e-04) (hash(x)=42762731) +870 train 3.335392 (lr=5.9002e-04) (hash(x)=35060049) +871 train 3.429202 (lr=5.8989e-04) (hash(x)=39976425) +872 train 3.324827 (lr=5.8976e-04) (hash(x)=38214454) +873 train 3.344672 (lr=5.8963e-04) (hash(x)=42364096) +874 train 3.370833 (lr=5.8950e-04) (hash(x)=38654188) +875 val loss 3.3033 +875 val perplexity 27.2012 +875 train 3.414412 (lr=5.8937e-04) (hash(x)=40761828) +876 train 3.340573 (lr=5.8923e-04) (hash(x)=45687266) +877 train 3.343111 (lr=5.8910e-04) (hash(x)=39312694) +878 train 3.326719 (lr=5.8897e-04) (hash(x)=36394130) +879 train 3.264065 (lr=5.8883e-04) (hash(x)=66071500) +880 train 3.311596 (lr=5.8869e-04) (hash(x)=38569900) +881 train 3.288641 (lr=5.8856e-04) (hash(x)=33699086) +882 train 3.369281 (lr=5.8842e-04) (hash(x)=32519322) +883 train 3.319025 (lr=5.8828e-04) (hash(x)=39641265) +884 train 3.312980 (lr=5.8814e-04) (hash(x)=44408846) +885 train 3.301936 (lr=5.8800e-04) (hash(x)=32330480) +886 train 3.318280 (lr=5.8786e-04) (hash(x)=42447782) +887 train 3.365102 (lr=5.8772e-04) (hash(x)=41354450) +888 train 3.300578 (lr=5.8758e-04) (hash(x)=40576941) +889 train 3.372003 (lr=5.8744e-04) (hash(x)=40444791) +890 train 3.300646 (lr=5.8729e-04) (hash(x)=45378763) +891 train 3.325591 (lr=5.8715e-04) (hash(x)=38851912) +892 train 3.284502 (lr=5.8700e-04) (hash(x)=44515373) +893 train 3.318650 (lr=5.8686e-04) (hash(x)=44532900) +894 train 3.356808 (lr=5.8671e-04) (hash(x)=49302694) +895 train 3.401053 (lr=5.8656e-04) (hash(x)=37746808) +896 train 3.280532 (lr=5.8642e-04) (hash(x)=41579253) +897 train 3.284887 (lr=5.8627e-04) (hash(x)=41792192) +898 train 3.309274 (lr=5.8612e-04) (hash(x)=36578813) +899 train 3.321672 (lr=5.8597e-04) (hash(x)=39146280) +900 val loss 3.3013 +900 val perplexity 27.1468 +900 train 3.315093 (lr=5.8581e-04) (hash(x)=38092182) +901 train 3.330921 (lr=5.8566e-04) (hash(x)=41684237) +902 train 3.345007 (lr=5.8551e-04) (hash(x)=36795766) +903 train 3.397699 (lr=5.8535e-04) (hash(x)=33939329) +904 train 3.325243 (lr=5.8520e-04) (hash(x)=36397918) +905 train 3.349005 (lr=5.8504e-04) (hash(x)=40620613) +906 train 3.411980 (lr=5.8489e-04) (hash(x)=42761291) +907 train 3.338989 (lr=5.8473e-04) (hash(x)=38698600) +908 train 3.471313 (lr=5.8457e-04) (hash(x)=37086298) +909 train 3.308287 (lr=5.8441e-04) (hash(x)=36306169) +910 train 3.368429 (lr=5.8425e-04) (hash(x)=34975881) +911 train 3.380259 (lr=5.8409e-04) (hash(x)=45313690) +912 train 3.396895 (lr=5.8393e-04) (hash(x)=36771818) +913 train 3.352238 (lr=5.8377e-04) (hash(x)=34594639) +914 train 3.312431 (lr=5.8361e-04) (hash(x)=42405006) +915 train 3.311236 (lr=5.8345e-04) (hash(x)=38610975) +916 train 3.311289 (lr=5.8328e-04) (hash(x)=40928704) +917 train 3.327881 (lr=5.8312e-04) (hash(x)=41602844) +918 train 3.315010 (lr=5.8295e-04) (hash(x)=44618165) +919 train 3.363048 (lr=5.8278e-04) (hash(x)=40549309) +920 train 3.270802 (lr=5.8262e-04) (hash(x)=37190519) +921 train 3.300708 (lr=5.8245e-04) (hash(x)=39152271) +922 train 3.323272 (lr=5.8228e-04) (hash(x)=39238802) +923 train 3.316915 (lr=5.8211e-04) (hash(x)=45161966) +924 train 3.251153 (lr=5.8194e-04) (hash(x)=41243789) +925 val loss 3.3045 +925 val perplexity 27.2339 +925 train 3.289578 (lr=5.8177e-04) (hash(x)=43482615) +926 train 3.354106 (lr=5.8160e-04) (hash(x)=45015737) +927 train 3.299091 (lr=5.8142e-04) (hash(x)=42818104) +928 train 3.363080 (lr=5.8125e-04) (hash(x)=36241177) +929 train 3.366659 (lr=5.8107e-04) (hash(x)=41300720) +930 train 3.350844 (lr=5.8090e-04) (hash(x)=41719287) +931 train 3.315918 (lr=5.8072e-04) (hash(x)=45132690) +932 train 3.297800 (lr=5.8055e-04) (hash(x)=48688021) +933 train 3.309858 (lr=5.8037e-04) (hash(x)=34670038) +934 train 3.364506 (lr=5.8019e-04) (hash(x)=40038592) +935 train 3.329410 (lr=5.8001e-04) (hash(x)=35109955) +936 train 3.363720 (lr=5.7983e-04) (hash(x)=41393849) +937 train 3.330168 (lr=5.7965e-04) (hash(x)=41680355) +938 train 3.362713 (lr=5.7947e-04) (hash(x)=25945232) +939 train 3.291922 (lr=5.7929e-04) (hash(x)=39977991) +940 train 3.287713 (lr=5.7911e-04) (hash(x)=40379888) +941 train 3.365014 (lr=5.7892e-04) (hash(x)=40534971) +942 train 3.352053 (lr=5.7874e-04) (hash(x)=39389012) +943 train 3.373327 (lr=5.7855e-04) (hash(x)=37163383) +944 train 3.364157 (lr=5.7837e-04) (hash(x)=41875016) +945 train 3.335896 (lr=5.7818e-04) (hash(x)=38280763) +946 train 3.393673 (lr=5.7799e-04) (hash(x)=40022515) +947 train 3.357941 (lr=5.7780e-04) (hash(x)=38346031) +948 train 3.582369 (lr=5.7761e-04) (hash(x)=43418428) +949 train 3.316856 (lr=5.7742e-04) (hash(x)=39303793) +950 val loss 3.3060 +950 val perplexity 27.2754 +950 train 3.426165 (lr=5.7723e-04) (hash(x)=45726687) +951 train 3.313914 (lr=5.7704e-04) (hash(x)=38324356) +952 train 3.282005 (lr=5.7685e-04) (hash(x)=38122452) +953 train 3.296214 (lr=5.7666e-04) (hash(x)=30169930) +954 train 3.312480 (lr=5.7646e-04) (hash(x)=38960292) +955 train 3.246385 (lr=5.7627e-04) (hash(x)=39141688) +956 train 3.341323 (lr=5.7607e-04) (hash(x)=41185634) +957 train 3.288545 (lr=5.7588e-04) (hash(x)=40018402) +958 train 3.319247 (lr=5.7568e-04) (hash(x)=40073964) +959 train 3.254483 (lr=5.7548e-04) (hash(x)=45028086) +960 train 3.278660 (lr=5.7529e-04) (hash(x)=43997058) +961 train 3.292697 (lr=5.7509e-04) (hash(x)=34708259) +962 train 3.372743 (lr=5.7489e-04) (hash(x)=34651410) +963 train 3.272929 (lr=5.7469e-04) (hash(x)=38728781) +964 train 3.383946 (lr=5.7449e-04) (hash(x)=43979758) +965 train 3.388941 (lr=5.7428e-04) (hash(x)=40997721) +966 train 3.293779 (lr=5.7408e-04) (hash(x)=37971810) +967 train 3.343479 (lr=5.7388e-04) (hash(x)=43792649) +968 train 3.377371 (lr=5.7367e-04) (hash(x)=44971396) +969 train 3.422727 (lr=5.7347e-04) (hash(x)=41142642) +970 train 3.269267 (lr=5.7326e-04) (hash(x)=46233422) +971 train 3.310530 (lr=5.7306e-04) (hash(x)=40692727) +972 train 3.304075 (lr=5.7285e-04) (hash(x)=38718756) +973 train 3.286105 (lr=5.7264e-04) (hash(x)=42131042) +974 train 3.339827 (lr=5.7243e-04) (hash(x)=36341492) +975 val loss 3.2980 +975 val perplexity 27.0592 +975 train 3.335539 (lr=5.7222e-04) (hash(x)=46072106) +976 train 3.379056 (lr=5.7201e-04) (hash(x)=40035336) +977 train 3.328197 (lr=5.7180e-04) (hash(x)=47803749) +978 train 3.332076 (lr=5.7159e-04) (hash(x)=43247521) +979 train 3.366739 (lr=5.7138e-04) (hash(x)=37627670) +980 train 3.305417 (lr=5.7116e-04) (hash(x)=39637270) +981 train 3.395566 (lr=5.7095e-04) (hash(x)=41717100) +982 train 3.350986 (lr=5.7073e-04) (hash(x)=39704195) +983 train 3.336194 (lr=5.7052e-04) (hash(x)=37720937) +984 train 3.340769 (lr=5.7030e-04) (hash(x)=43876559) +985 train 3.419091 (lr=5.7008e-04) (hash(x)=43782527) +986 train 3.356003 (lr=5.6987e-04) (hash(x)=40875624) +987 train 3.292574 (lr=5.6965e-04) (hash(x)=42787331) +988 train 3.331186 (lr=5.6943e-04) (hash(x)=38346755) +989 train 3.272264 (lr=5.6921e-04) (hash(x)=40502548) +990 train 3.264494 (lr=5.6899e-04) (hash(x)=45653458) +991 train 3.285812 (lr=5.6877e-04) (hash(x)=49983434) +992 train 3.290422 (lr=5.6854e-04) (hash(x)=39939815) +993 train 3.334520 (lr=5.6832e-04) (hash(x)=42208875) +994 train 3.290647 (lr=5.6810e-04) (hash(x)=32909933) +995 train 3.332891 (lr=5.6787e-04) (hash(x)=37617340) +996 train 3.300418 (lr=5.6765e-04) (hash(x)=34882224) +997 train 3.343617 (lr=5.6742e-04) (hash(x)=36240264) +998 train 3.315077 (lr=5.6720e-04) (hash(x)=37466827) +999 train 3.354597 (lr=5.6697e-04) (hash(x)=46731360) +1000 val loss 3.3120 +1000 val perplexity 27.4388 +1000 hella 0.2816 +1000 train 3.354616 (lr=5.6674e-04) (hash(x)=38259788) +1001 train 3.315068 (lr=5.6651e-04) (hash(x)=39986803) +1002 train 3.308269 (lr=5.6628e-04) (hash(x)=35534106) +1003 train 3.316445 (lr=5.6605e-04) (hash(x)=38710791) +1004 train 3.341246 (lr=5.6582e-04) (hash(x)=42136532) +1005 train 3.371834 (lr=5.6559e-04) (hash(x)=38447668) +1006 train 3.274629 (lr=5.6536e-04) (hash(x)=38086106) +1007 train 3.321367 (lr=5.6512e-04) (hash(x)=37896807) +1008 train 3.308686 (lr=5.6489e-04) (hash(x)=39838508) +1009 train 3.359637 (lr=5.6465e-04) (hash(x)=42983008) +1010 train 3.349885 (lr=5.6442e-04) (hash(x)=37879033) +1011 train 3.321376 (lr=5.6418e-04) (hash(x)=40266335) +1012 train 3.349489 (lr=5.6395e-04) (hash(x)=48654989) +1013 train 3.465202 (lr=5.6371e-04) (hash(x)=34204794) +1014 train 3.341062 (lr=5.6347e-04) (hash(x)=38030214) +1015 train 3.349506 (lr=5.6323e-04) (hash(x)=35145589) +1016 train 3.355400 (lr=5.6299e-04) (hash(x)=37755043) +1017 train 3.341312 (lr=5.6275e-04) (hash(x)=40788735) +1018 train 3.429115 (lr=5.6251e-04) (hash(x)=47543123) +1019 train 3.382512 (lr=5.6227e-04) (hash(x)=35663269) +1020 train 3.349150 (lr=5.6202e-04) (hash(x)=35802333) +1021 train 3.307950 (lr=5.6178e-04) (hash(x)=43795973) +1022 train 3.364079 (lr=5.6154e-04) (hash(x)=44824186) +1023 train 3.339589 (lr=5.6129e-04) (hash(x)=39042856) +1024 train 3.330900 (lr=5.6105e-04) (hash(x)=42729079) +1025 val loss 3.2985 +1025 val perplexity 27.0730 +1025 train 3.276234 (lr=5.6080e-04) (hash(x)=34043578) +1026 train 3.310078 (lr=5.6055e-04) (hash(x)=33126235) +1027 train 3.371984 (lr=5.6031e-04) (hash(x)=44891665) +1028 train 3.277772 (lr=5.6006e-04) (hash(x)=39189706) +1029 train 3.323407 (lr=5.5981e-04) (hash(x)=39545035) +1030 train 3.351743 (lr=5.5956e-04) (hash(x)=35645099) +1031 train 3.322877 (lr=5.5931e-04) (hash(x)=48424449) +1032 train 3.288828 (lr=5.5906e-04) (hash(x)=56814915) +1033 train 3.255849 (lr=5.5880e-04) (hash(x)=42803627) +1034 train 3.245120 (lr=5.5855e-04) (hash(x)=44146453) +1035 train 3.285050 (lr=5.5830e-04) (hash(x)=39325736) +1036 train 3.264024 (lr=5.5804e-04) (hash(x)=38304947) +1037 train 3.334048 (lr=5.5779e-04) (hash(x)=38337913) +1038 train 3.368427 (lr=5.5753e-04) (hash(x)=43161847) +1039 train 3.309593 (lr=5.5728e-04) (hash(x)=40675920) +1040 train 3.370563 (lr=5.5702e-04) (hash(x)=37319063) +1041 train 3.288466 (lr=5.5676e-04) (hash(x)=39004997) +1042 train 3.312186 (lr=5.5651e-04) (hash(x)=47166456) +1043 train 3.311754 (lr=5.5625e-04) (hash(x)=36913429) +1044 train 3.307413 (lr=5.5599e-04) (hash(x)=39056701) +1045 train 3.356579 (lr=5.5573e-04) (hash(x)=45421796) +1046 train 3.354339 (lr=5.5547e-04) (hash(x)=36160608) +1047 train 3.360981 (lr=5.5520e-04) (hash(x)=43076985) +1048 train 3.321566 (lr=5.5494e-04) (hash(x)=30507378) +1049 train 3.323468 (lr=5.5468e-04) (hash(x)=45041067) +1050 val loss 3.2956 +1050 val perplexity 26.9935 +1050 train 3.344305 (lr=5.5441e-04) (hash(x)=42747809) +1051 train 3.377254 (lr=5.5415e-04) (hash(x)=43506947) +1052 train 3.328801 (lr=5.5388e-04) (hash(x)=40783958) +1053 train 3.393998 (lr=5.5362e-04) (hash(x)=44791537) +1054 train 3.336300 (lr=5.5335e-04) (hash(x)=41427328) +1055 train 3.310909 (lr=5.5308e-04) (hash(x)=35154738) +1056 train 3.362327 (lr=5.5282e-04) (hash(x)=44362704) +1057 train 3.393444 (lr=5.5255e-04) (hash(x)=35793761) +1058 train 3.342751 (lr=5.5228e-04) (hash(x)=36460310) +1059 train 3.407602 (lr=5.5201e-04) (hash(x)=38511358) +1060 train 3.349198 (lr=5.5174e-04) (hash(x)=40022979) +1061 train 3.321412 (lr=5.5147e-04) (hash(x)=36505590) +1062 train 3.318002 (lr=5.5119e-04) (hash(x)=41472583) +1063 train 3.265956 (lr=5.5092e-04) (hash(x)=37541927) +1064 train 3.321599 (lr=5.5065e-04) (hash(x)=35943974) +1065 train 3.288446 (lr=5.5037e-04) (hash(x)=45725108) +1066 train 3.305224 (lr=5.5010e-04) (hash(x)=41448922) +1067 train 3.342351 (lr=5.4982e-04) (hash(x)=39486090) +1068 train 3.354583 (lr=5.4955e-04) (hash(x)=39976931) +1069 train 3.308798 (lr=5.4927e-04) (hash(x)=35687278) +1070 train 3.251938 (lr=5.4899e-04) (hash(x)=35355158) +1071 train 3.265251 (lr=5.4871e-04) (hash(x)=36996201) +1072 train 3.245654 (lr=5.4843e-04) (hash(x)=40199326) +1073 train 3.244185 (lr=5.4815e-04) (hash(x)=38830465) +1074 train 3.297732 (lr=5.4787e-04) (hash(x)=42611204) +1075 val loss 3.2919 +1075 val perplexity 26.8927 +1075 train 3.367773 (lr=5.4759e-04) (hash(x)=38546908) +1076 train 3.345248 (lr=5.4731e-04) (hash(x)=35090984) +1077 train 3.262281 (lr=5.4703e-04) (hash(x)=40771570) +1078 train 3.297897 (lr=5.4675e-04) (hash(x)=41632090) +1079 train 3.341362 (lr=5.4646e-04) (hash(x)=40226910) +1080 train 3.286685 (lr=5.4618e-04) (hash(x)=40341768) +1081 train 3.317158 (lr=5.4589e-04) (hash(x)=33363996) +1082 train 3.345828 (lr=5.4561e-04) (hash(x)=33695913) +1083 train 3.403521 (lr=5.4532e-04) (hash(x)=46436324) +1084 train 3.323102 (lr=5.4503e-04) (hash(x)=37553901) +1085 train 3.341651 (lr=5.4475e-04) (hash(x)=37956850) +1086 train 3.349155 (lr=5.4446e-04) (hash(x)=31887011) +1087 train 3.310434 (lr=5.4417e-04) (hash(x)=46147811) +1088 train 3.293821 (lr=5.4388e-04) (hash(x)=43133315) +1089 train 3.389830 (lr=5.4359e-04) (hash(x)=42249123) +1090 train 3.368762 (lr=5.4330e-04) (hash(x)=43433659) +1091 train 3.410495 (lr=5.4301e-04) (hash(x)=38783511) +1092 train 3.348524 (lr=5.4271e-04) (hash(x)=40312733) +1093 train 3.359149 (lr=5.4242e-04) (hash(x)=39463476) +1094 train 3.337964 (lr=5.4213e-04) (hash(x)=39843092) +1095 train 3.349276 (lr=5.4183e-04) (hash(x)=30702715) +1096 train 3.277423 (lr=5.4154e-04) (hash(x)=43189659) +1097 train 3.318753 (lr=5.4124e-04) (hash(x)=40329272) +1098 train 3.348983 (lr=5.4095e-04) (hash(x)=37797506) +1099 train 3.314929 (lr=5.4065e-04) (hash(x)=36421442) +1100 val loss 3.2956 +1100 val perplexity 26.9939 +1100 train 3.310699 (lr=5.4035e-04) (hash(x)=38385429) +1101 train 3.326031 (lr=5.4005e-04) (hash(x)=37740942) +1102 train 3.275000 (lr=5.3975e-04) (hash(x)=39616330) +1103 train 3.303461 (lr=5.3946e-04) (hash(x)=36669428) +1104 train 3.310378 (lr=5.3915e-04) (hash(x)=43951920) +1105 train 3.226639 (lr=5.3885e-04) (hash(x)=41776245) +1106 train 3.259569 (lr=5.3855e-04) (hash(x)=46196653) +1107 train 3.261366 (lr=5.3825e-04) (hash(x)=38677786) +1108 train 3.276481 (lr=5.3795e-04) (hash(x)=42350771) +1109 train 3.204938 (lr=5.3764e-04) (hash(x)=38009483) +1110 train 3.340300 (lr=5.3734e-04) (hash(x)=44555136) +1111 train 3.302994 (lr=5.3704e-04) (hash(x)=41733955) +1112 train 3.325189 (lr=5.3673e-04) (hash(x)=42427295) +1113 train 3.307445 (lr=5.3642e-04) (hash(x)=48048304) +1114 train 3.343986 (lr=5.3612e-04) (hash(x)=42866277) +1115 train 3.272760 (lr=5.3581e-04) (hash(x)=40469369) +1116 train 3.319786 (lr=5.3550e-04) (hash(x)=36507138) +1117 train 3.259008 (lr=5.3519e-04) (hash(x)=42924578) +1118 train 3.289931 (lr=5.3488e-04) (hash(x)=42847929) +1119 train 3.276306 (lr=5.3457e-04) (hash(x)=42491517) +1120 train 3.314617 (lr=5.3426e-04) (hash(x)=37507657) +1121 train 3.283342 (lr=5.3395e-04) (hash(x)=39659597) +1122 train 3.354067 (lr=5.3364e-04) (hash(x)=39790875) +1123 train 3.315947 (lr=5.3333e-04) (hash(x)=42448764) +1124 train 3.330831 (lr=5.3302e-04) (hash(x)=45090726) +1125 val loss 3.2874 +1125 val perplexity 26.7719 +1125 train 3.344871 (lr=5.3270e-04) (hash(x)=39648838) +1126 train 3.413704 (lr=5.3239e-04) (hash(x)=45058839) +1127 train 3.327638 (lr=5.3207e-04) (hash(x)=37194937) +1128 train 3.340443 (lr=5.3176e-04) (hash(x)=36891310) +1129 train 3.356966 (lr=5.3144e-04) (hash(x)=37486036) +1130 train 3.353731 (lr=5.3113e-04) (hash(x)=49452418) +1131 train 3.387845 (lr=5.3081e-04) (hash(x)=38560900) +1132 train 3.296344 (lr=5.3049e-04) (hash(x)=39370068) +1133 train 3.314002 (lr=5.3017e-04) (hash(x)=37736397) +1134 train 3.360266 (lr=5.2985e-04) (hash(x)=37822910) +1135 train 3.301275 (lr=5.2953e-04) (hash(x)=38882563) +1136 train 3.309966 (lr=5.2921e-04) (hash(x)=34037164) +1137 train 3.249722 (lr=5.2889e-04) (hash(x)=38704838) +1138 train 3.231123 (lr=5.2857e-04) (hash(x)=37853907) +1139 train 3.316841 (lr=5.2825e-04) (hash(x)=38738519) +1140 train 3.256415 (lr=5.2792e-04) (hash(x)=37453717) +1141 train 3.269556 (lr=5.2760e-04) (hash(x)=33339496) +1142 train 3.286184 (lr=5.2728e-04) (hash(x)=45646188) +1143 train 3.341795 (lr=5.2695e-04) (hash(x)=42314467) +1144 train 3.292365 (lr=5.2663e-04) (hash(x)=35054019) +1145 train 3.240709 (lr=5.2630e-04) (hash(x)=42263264) +1146 train 3.245614 (lr=5.2597e-04) (hash(x)=37198639) +1147 train 3.288842 (lr=5.2565e-04) (hash(x)=32163188) +1148 train 3.329484 (lr=5.2532e-04) (hash(x)=40648352) +1149 train 3.299650 (lr=5.2499e-04) (hash(x)=39881159) +1150 val loss 3.2872 +1150 val perplexity 26.7681 +1150 train 3.314563 (lr=5.2466e-04) (hash(x)=41265793) +1151 train 3.343322 (lr=5.2433e-04) (hash(x)=40309695) +1152 train 3.356673 (lr=5.2400e-04) (hash(x)=36746188) +1153 train 3.323818 (lr=5.2367e-04) (hash(x)=42954207) +1154 train 3.368424 (lr=5.2334e-04) (hash(x)=39243781) +1155 train 3.382593 (lr=5.2301e-04) (hash(x)=41747540) +1156 train 3.313076 (lr=5.2267e-04) (hash(x)=40499683) +1157 train 3.331265 (lr=5.2234e-04) (hash(x)=43164299) +1158 train 3.446682 (lr=5.2201e-04) (hash(x)=41156396) +1159 train 3.361506 (lr=5.2167e-04) (hash(x)=44110407) +1160 train 3.338482 (lr=5.2134e-04) (hash(x)=38127989) +1161 train 3.261809 (lr=5.2100e-04) (hash(x)=37855623) +1162 train 3.398008 (lr=5.2067e-04) (hash(x)=43262926) +1163 train 3.384193 (lr=5.2033e-04) (hash(x)=41375649) +1164 train 3.332202 (lr=5.1999e-04) (hash(x)=43807592) +1165 train 3.363470 (lr=5.1965e-04) (hash(x)=40676687) +1166 train 3.314995 (lr=5.1932e-04) (hash(x)=37816824) +1167 train 3.325182 (lr=5.1898e-04) (hash(x)=41800751) +1168 train 3.349487 (lr=5.1864e-04) (hash(x)=35681452) +1169 train 3.288806 (lr=5.1830e-04) (hash(x)=39162014) +1170 train 3.324909 (lr=5.1796e-04) (hash(x)=41006385) +1171 train 3.376823 (lr=5.1761e-04) (hash(x)=39169701) +1172 train 3.205763 (lr=5.1727e-04) (hash(x)=39586924) +1173 train 3.312923 (lr=5.1693e-04) (hash(x)=39910967) +1174 train 3.295381 (lr=5.1659e-04) (hash(x)=40046720) +1175 val loss 3.2869 +1175 val perplexity 26.7588 +1175 train 3.299757 (lr=5.1624e-04) (hash(x)=32570405) +1176 train 3.284462 (lr=5.1590e-04) (hash(x)=39195667) +1177 train 3.312025 (lr=5.1555e-04) (hash(x)=41718755) +1178 train 3.267867 (lr=5.1521e-04) (hash(x)=35553657) +1179 train 3.328298 (lr=5.1486e-04) (hash(x)=41124581) +1180 train 3.287957 (lr=5.1452e-04) (hash(x)=47398992) +1181 train 3.291907 (lr=5.1417e-04) (hash(x)=39056766) +1182 train 3.267929 (lr=5.1382e-04) (hash(x)=41055038) +1183 train 3.292418 (lr=5.1347e-04) (hash(x)=41819366) +1184 train 3.242483 (lr=5.1312e-04) (hash(x)=46694713) +1185 train 3.324704 (lr=5.1277e-04) (hash(x)=39437401) +1186 train 3.364383 (lr=5.1242e-04) (hash(x)=36888069) +1187 train 3.325828 (lr=5.1207e-04) (hash(x)=45929995) +1188 train 3.335308 (lr=5.1172e-04) (hash(x)=38546732) +1189 train 3.347815 (lr=5.1137e-04) (hash(x)=36680802) +1190 train 3.363842 (lr=5.1102e-04) (hash(x)=38786934) +1191 train 3.363204 (lr=5.1067e-04) (hash(x)=44930201) +1192 train 3.255285 (lr=5.1031e-04) (hash(x)=42393922) +1193 train 3.321240 (lr=5.0996e-04) (hash(x)=36078148) +1194 train 3.290506 (lr=5.0960e-04) (hash(x)=28341513) +1195 train 3.351316 (lr=5.0925e-04) (hash(x)=38190734) +1196 train 3.345533 (lr=5.0889e-04) (hash(x)=35948974) +1197 train 3.350020 (lr=5.0854e-04) (hash(x)=38341663) +1198 train 3.318807 (lr=5.0818e-04) (hash(x)=40685865) +1199 train 3.300825 (lr=5.0782e-04) (hash(x)=42763687) +1200 val loss 3.2891 +1200 val perplexity 26.8178 +1200 train 3.350645 (lr=5.0746e-04) (hash(x)=36510407) +1201 train 3.321133 (lr=5.0711e-04) (hash(x)=36741367) +1202 train 3.419550 (lr=5.0675e-04) (hash(x)=28412303) +1203 train 3.301863 (lr=5.0639e-04) (hash(x)=40457902) +1204 train 3.362588 (lr=5.0603e-04) (hash(x)=42491717) +1205 train 3.301311 (lr=5.0567e-04) (hash(x)=37482597) +1206 train 3.342213 (lr=5.0531e-04) (hash(x)=36012514) +1207 train 3.338910 (lr=5.0494e-04) (hash(x)=36387693) +1208 train 3.340410 (lr=5.0458e-04) (hash(x)=37483864) +1209 train 3.310048 (lr=5.0422e-04) (hash(x)=34596280) +1210 train 3.272423 (lr=5.0386e-04) (hash(x)=41634000) +1211 train 3.271992 (lr=5.0349e-04) (hash(x)=37487762) +1212 train 3.298360 (lr=5.0313e-04) (hash(x)=38347748) +1213 train 3.257198 (lr=5.0276e-04) (hash(x)=41344044) +1214 train 3.262406 (lr=5.0240e-04) (hash(x)=46863337) +1215 train 3.244890 (lr=5.0203e-04) (hash(x)=39037377) +1216 train 3.252921 (lr=5.0166e-04) (hash(x)=38801326) +1217 train 3.281106 (lr=5.0130e-04) (hash(x)=39327359) +1218 train 3.301770 (lr=5.0093e-04) (hash(x)=43151597) +1219 train 3.293507 (lr=5.0056e-04) (hash(x)=40129808) +1220 train 3.294514 (lr=5.0019e-04) (hash(x)=37291065) +1221 train 3.285643 (lr=4.9982e-04) (hash(x)=39773254) +1222 train 3.300490 (lr=4.9945e-04) (hash(x)=43667465) +1223 train 3.305688 (lr=4.9908e-04) (hash(x)=39131272) +1224 train 3.400890 (lr=4.9871e-04) (hash(x)=44103497) +1225 val loss 3.2817 +1225 val perplexity 26.6197 +1225 train 3.246879 (lr=4.9834e-04) (hash(x)=40691059) +1226 train 3.391816 (lr=4.9797e-04) (hash(x)=37598284) +1227 train 3.315708 (lr=4.9760e-04) (hash(x)=41591858) +1228 train 3.346153 (lr=4.9723e-04) (hash(x)=46667993) +1229 train 3.273892 (lr=4.9685e-04) (hash(x)=42954613) +1230 train 3.248708 (lr=4.9648e-04) (hash(x)=38245122) +1231 train 3.096381 (lr=4.9610e-04) (hash(x)=40408023) +1232 train 3.326403 (lr=4.9573e-04) (hash(x)=38539618) +1233 train 3.328393 (lr=4.9535e-04) (hash(x)=36535091) +1234 train 3.335335 (lr=4.9498e-04) (hash(x)=38548597) +1235 train 3.368284 (lr=4.9460e-04) (hash(x)=36491984) +1236 train 3.274086 (lr=4.9422e-04) (hash(x)=43141110) +1237 train 3.356190 (lr=4.9385e-04) (hash(x)=37903413) +1238 train 3.378433 (lr=4.9347e-04) (hash(x)=40042314) +1239 train 3.417743 (lr=4.9309e-04) (hash(x)=40277225) +1240 train 3.334957 (lr=4.9271e-04) (hash(x)=46159886) +1241 train 3.291672 (lr=4.9233e-04) (hash(x)=40452730) +1242 train 3.365424 (lr=4.9195e-04) (hash(x)=42740600) +1243 train 3.324234 (lr=4.9157e-04) (hash(x)=40163565) +1244 train 3.387341 (lr=4.9119e-04) (hash(x)=39163304) +1245 train 3.412989 (lr=4.9081e-04) (hash(x)=36990849) +1246 train 3.318247 (lr=4.9043e-04) (hash(x)=38984729) +1247 train 3.257343 (lr=4.9004e-04) (hash(x)=41197400) +1248 train 3.240033 (lr=4.8966e-04) (hash(x)=40075903) +1249 train 3.348331 (lr=4.8928e-04) (hash(x)=39298262) +1250 val loss 3.2836 +1250 val perplexity 26.6726 +1250 hella 0.2821 +1250 train 3.261740 (lr=4.8889e-04) (hash(x)=46144039) +1251 train 3.219538 (lr=4.8851e-04) (hash(x)=37024814) +1252 train 3.252364 (lr=4.8812e-04) (hash(x)=37124594) +1253 train 3.239949 (lr=4.8774e-04) (hash(x)=38583567) +1254 train 3.299442 (lr=4.8735e-04) (hash(x)=38675015) +1255 train 3.262612 (lr=4.8697e-04) (hash(x)=39654694) +1256 train 3.262064 (lr=4.8658e-04) (hash(x)=37285090) +1257 train 3.255364 (lr=4.8619e-04) (hash(x)=40107816) +1258 train 3.303387 (lr=4.8580e-04) (hash(x)=35623735) +1259 train 3.343078 (lr=4.8542e-04) (hash(x)=40237332) +1260 train 3.329415 (lr=4.8503e-04) (hash(x)=40100893) +1261 train 3.274264 (lr=4.8464e-04) (hash(x)=45124397) +1262 train 3.319643 (lr=4.8425e-04) (hash(x)=38438370) +1263 train 3.272336 (lr=4.8386e-04) (hash(x)=39559121) +1264 train 3.386246 (lr=4.8347e-04) (hash(x)=40593074) +1265 train 3.349120 (lr=4.8308e-04) (hash(x)=29069034) +1266 train 3.327642 (lr=4.8268e-04) (hash(x)=45199483) +1267 train 3.365158 (lr=4.8229e-04) (hash(x)=41148702) +1268 train 3.351280 (lr=4.8190e-04) (hash(x)=37334515) +1269 train 3.329659 (lr=4.8151e-04) (hash(x)=41293871) +1270 train 3.335042 (lr=4.8111e-04) (hash(x)=36886272) +1271 train 3.351181 (lr=4.8072e-04) (hash(x)=36672708) +1272 train 3.322778 (lr=4.8032e-04) (hash(x)=36317321) +1273 train 3.382790 (lr=4.7993e-04) (hash(x)=33958793) +1274 train 3.312306 (lr=4.7953e-04) (hash(x)=39225371) +1275 val loss 3.2793 +1275 val perplexity 26.5559 +1275 train 3.339274 (lr=4.7914e-04) (hash(x)=40935461) +1276 train 3.325573 (lr=4.7874e-04) (hash(x)=40185627) +1277 train 3.326092 (lr=4.7835e-04) (hash(x)=40690388) +1278 train 3.285831 (lr=4.7795e-04) (hash(x)=37890590) +1279 train 3.476016 (lr=4.7755e-04) (hash(x)=38244980) +1280 train 3.338696 (lr=4.7715e-04) (hash(x)=36925406) +1281 train 3.309455 (lr=4.7675e-04) (hash(x)=37872328) +1282 train 3.342942 (lr=4.7635e-04) (hash(x)=40164657) +1283 train 3.271099 (lr=4.7595e-04) (hash(x)=42375623) +1284 train 3.296741 (lr=4.7555e-04) (hash(x)=44936125) +1285 train 3.327364 (lr=4.7515e-04) (hash(x)=40451167) +1286 train 3.266821 (lr=4.7475e-04) (hash(x)=40729072) +1287 train 3.314111 (lr=4.7435e-04) (hash(x)=36024219) +1288 train 3.291495 (lr=4.7395e-04) (hash(x)=42637621) +1289 train 3.340467 (lr=4.7355e-04) (hash(x)=39712686) +1290 train 3.285119 (lr=4.7315e-04) (hash(x)=36857687) +1291 train 3.269586 (lr=4.7274e-04) (hash(x)=33573246) +1292 train 3.285590 (lr=4.7234e-04) (hash(x)=35736716) +1293 train 3.252886 (lr=4.7193e-04) (hash(x)=37201641) +1294 train 3.312443 (lr=4.7153e-04) (hash(x)=39084919) +1295 train 3.271648 (lr=4.7113e-04) (hash(x)=36283426) +1296 train 3.235553 (lr=4.7072e-04) (hash(x)=56110699) +1297 train 3.289788 (lr=4.7031e-04) (hash(x)=39704634) +1298 train 3.243474 (lr=4.6991e-04) (hash(x)=39707432) +1299 train 3.301358 (lr=4.6950e-04) (hash(x)=38400003) +1300 val loss 3.2764 +1300 val perplexity 26.4797 +1300 train 3.306445 (lr=4.6909e-04) (hash(x)=33831302) +1301 train 3.243367 (lr=4.6869e-04) (hash(x)=43120379) +1302 train 3.262793 (lr=4.6828e-04) (hash(x)=43516041) +1303 train 3.246762 (lr=4.6787e-04) (hash(x)=43250783) +1304 train 3.328827 (lr=4.6746e-04) (hash(x)=32840703) +1305 train 3.239157 (lr=4.6705e-04) (hash(x)=44849759) +1306 train 3.212572 (lr=4.6664e-04) (hash(x)=39518164) +1307 train 3.261796 (lr=4.6623e-04) (hash(x)=41335201) +1308 train 3.310780 (lr=4.6582e-04) (hash(x)=40915034) +1309 train 3.332818 (lr=4.6541e-04) (hash(x)=40093508) +1310 train 3.381927 (lr=4.6500e-04) (hash(x)=40037948) +1311 train 3.296527 (lr=4.6459e-04) (hash(x)=37728713) +1312 train 3.358385 (lr=4.6418e-04) (hash(x)=40690279) +1313 train 3.304103 (lr=4.6376e-04) (hash(x)=35412857) +1314 train 3.392497 (lr=4.6335e-04) (hash(x)=35525132) +1315 train 3.293284 (lr=4.6294e-04) (hash(x)=52011371) +1316 train 3.287557 (lr=4.6252e-04) (hash(x)=36480522) +1317 train 3.301067 (lr=4.6211e-04) (hash(x)=38040952) +1318 train 3.311764 (lr=4.6169e-04) (hash(x)=39093150) +1319 train 3.289346 (lr=4.6128e-04) (hash(x)=42079976) +1320 train 3.328548 (lr=4.6086e-04) (hash(x)=33277541) +1321 train 3.260725 (lr=4.6045e-04) (hash(x)=34147161) +1322 train 3.274237 (lr=4.6003e-04) (hash(x)=39644302) +1323 train 3.282117 (lr=4.5962e-04) (hash(x)=44779232) +1324 train 3.265670 (lr=4.5920e-04) (hash(x)=38520750) +1325 val loss 3.2756 +1325 val perplexity 26.4578 +1325 train 3.267365 (lr=4.5878e-04) (hash(x)=40663579) +1326 train 3.253336 (lr=4.5836e-04) (hash(x)=39777955) +1327 train 3.256373 (lr=4.5794e-04) (hash(x)=40761539) +1328 train 3.260446 (lr=4.5753e-04) (hash(x)=38195837) +1329 train 3.257487 (lr=4.5711e-04) (hash(x)=43195524) +1330 train 3.283612 (lr=4.5669e-04) (hash(x)=42089861) +1331 train 3.284552 (lr=4.5627e-04) (hash(x)=36211418) +1332 train 3.249240 (lr=4.5585e-04) (hash(x)=38307699) +1333 train 3.288564 (lr=4.5543e-04) (hash(x)=36863554) +1334 train 3.313014 (lr=4.5501e-04) (hash(x)=38132363) +1335 train 3.213975 (lr=4.5458e-04) (hash(x)=38194817) +1336 train 3.246494 (lr=4.5416e-04) (hash(x)=39539344) +1337 train 3.267940 (lr=4.5374e-04) (hash(x)=38541454) +1338 train 3.272973 (lr=4.5332e-04) (hash(x)=47904118) +1339 train 3.298921 (lr=4.5289e-04) (hash(x)=39933041) +1340 train 3.222360 (lr=4.5247e-04) (hash(x)=37637490) +1341 train 3.262579 (lr=4.5205e-04) (hash(x)=42139442) +1342 train 3.248047 (lr=4.5162e-04) (hash(x)=35934912) +1343 train 3.302522 (lr=4.5120e-04) (hash(x)=48823338) +1344 train 3.256904 (lr=4.5077e-04) (hash(x)=49115440) +1345 train 3.300764 (lr=4.5035e-04) (hash(x)=38703517) +1346 train 3.326438 (lr=4.4992e-04) (hash(x)=44848473) +1347 train 3.318638 (lr=4.4950e-04) (hash(x)=38919316) +1348 train 3.330583 (lr=4.4907e-04) (hash(x)=44936860) +1349 train 3.387609 (lr=4.4864e-04) (hash(x)=37849585) +1350 val loss 3.2661 +1350 val perplexity 26.2090 +1350 train 3.269374 (lr=4.4822e-04) (hash(x)=40918624) +1351 train 3.323258 (lr=4.4779e-04) (hash(x)=37599016) +1352 train 3.297241 (lr=4.4736e-04) (hash(x)=44397107) +1353 train 3.287842 (lr=4.4693e-04) (hash(x)=38161434) +1354 train 3.293662 (lr=4.4651e-04) (hash(x)=39047794) +1355 train 3.305627 (lr=4.4608e-04) (hash(x)=38489148) +1356 train 3.343147 (lr=4.4565e-04) (hash(x)=39504147) +1357 train 3.374524 (lr=4.4522e-04) (hash(x)=38702055) +1358 train 3.251864 (lr=4.4479e-04) (hash(x)=37528416) +1359 train 3.375572 (lr=4.4436e-04) (hash(x)=41174668) +1360 train 3.274051 (lr=4.4393e-04) (hash(x)=41585975) +1361 train 3.323668 (lr=4.4350e-04) (hash(x)=38379328) +1362 train 3.334449 (lr=4.4307e-04) (hash(x)=39583598) +1363 train 3.262573 (lr=4.4263e-04) (hash(x)=37458083) +1364 train 3.260324 (lr=4.4220e-04) (hash(x)=34688419) +1365 train 3.243323 (lr=4.4177e-04) (hash(x)=37093896) +1366 train 3.264951 (lr=4.4134e-04) (hash(x)=38861712) +1367 train 3.174399 (lr=4.4090e-04) (hash(x)=23550426) +1368 train 3.234195 (lr=4.4047e-04) (hash(x)=42137700) +1369 train 3.290488 (lr=4.4004e-04) (hash(x)=37060133) +1370 train 3.253551 (lr=4.3960e-04) (hash(x)=45739654) +1371 train 3.288732 (lr=4.3917e-04) (hash(x)=39427106) +1372 train 3.259333 (lr=4.3873e-04) (hash(x)=37120578) +1373 train 3.291646 (lr=4.3830e-04) (hash(x)=39860157) +1374 train 3.236897 (lr=4.3786e-04) (hash(x)=39290017) +1375 val loss 3.2625 +1375 val perplexity 26.1152 +1375 train 3.320230 (lr=4.3743e-04) (hash(x)=37244844) +1376 train 3.341229 (lr=4.3699e-04) (hash(x)=40432807) +1377 train 3.288800 (lr=4.3655e-04) (hash(x)=41225710) +1378 train 3.293099 (lr=4.3612e-04) (hash(x)=47049581) +1379 train 3.246913 (lr=4.3568e-04) (hash(x)=39406495) +1380 train 3.296351 (lr=4.3524e-04) (hash(x)=39127468) +1381 train 3.260353 (lr=4.3480e-04) (hash(x)=41911648) +1382 train 3.261763 (lr=4.3437e-04) (hash(x)=43133629) +1383 train 3.335563 (lr=4.3393e-04) (hash(x)=37283330) +1384 train 3.369015 (lr=4.3349e-04) (hash(x)=47191691) +1385 train 3.302108 (lr=4.3305e-04) (hash(x)=37766051) +1386 train 3.359694 (lr=4.3261e-04) (hash(x)=41699002) +1387 train 3.292019 (lr=4.3217e-04) (hash(x)=40364724) +1388 train 3.373484 (lr=4.3173e-04) (hash(x)=39738928) +1389 train 3.299696 (lr=4.3129e-04) (hash(x)=39659604) +1390 train 3.308591 (lr=4.3085e-04) (hash(x)=41402382) +1391 train 3.315047 (lr=4.3041e-04) (hash(x)=41037808) +1392 train 3.362841 (lr=4.2997e-04) (hash(x)=40860873) +1393 train 3.286460 (lr=4.2953e-04) (hash(x)=44430309) +1394 train 3.364479 (lr=4.2908e-04) (hash(x)=39878886) +1395 train 3.274521 (lr=4.2864e-04) (hash(x)=42737625) +1396 train 3.215331 (lr=4.2820e-04) (hash(x)=38285554) +1397 train 3.261464 (lr=4.2776e-04) (hash(x)=44353011) +1398 train 3.291091 (lr=4.2731e-04) (hash(x)=46890003) +1399 train 3.254843 (lr=4.2687e-04) (hash(x)=41076421) +1400 val loss 3.2645 +1400 val perplexity 26.1679 +1400 train 3.254497 (lr=4.2643e-04) (hash(x)=44362880) +1401 train 3.210367 (lr=4.2598e-04) (hash(x)=42430839) +1402 train 3.222520 (lr=4.2554e-04) (hash(x)=38768810) +1403 train 3.257919 (lr=4.2509e-04) (hash(x)=35764146) +1404 train 3.282436 (lr=4.2465e-04) (hash(x)=43856369) +1405 train 3.334722 (lr=4.2420e-04) (hash(x)=38787294) +1406 train 3.250153 (lr=4.2376e-04) (hash(x)=40608924) +1407 train 3.259876 (lr=4.2331e-04) (hash(x)=41795971) +1408 train 3.311702 (lr=4.2287e-04) (hash(x)=39889402) +1409 train 3.280544 (lr=4.2242e-04) (hash(x)=38251290) +1410 train 3.322867 (lr=4.2197e-04) (hash(x)=41623547) +1411 train 3.350786 (lr=4.2153e-04) (hash(x)=43622263) +1412 train 3.272982 (lr=4.2108e-04) (hash(x)=40792375) +1413 train 3.336279 (lr=4.2063e-04) (hash(x)=39780943) +1414 train 3.271462 (lr=4.2018e-04) (hash(x)=39467196) +1415 train 3.368441 (lr=4.1974e-04) (hash(x)=32100034) +1416 train 3.319520 (lr=4.1929e-04) (hash(x)=39976402) +1417 train 3.283653 (lr=4.1884e-04) (hash(x)=40356088) +1418 train 3.308766 (lr=4.1839e-04) (hash(x)=42497111) +1419 train 3.318784 (lr=4.1794e-04) (hash(x)=43064048) +1420 train 3.269221 (lr=4.1749e-04) (hash(x)=41962489) +1421 train 3.323027 (lr=4.1704e-04) (hash(x)=40477651) +1422 train 3.339953 (lr=4.1659e-04) (hash(x)=48335128) +1423 train 3.342857 (lr=4.1614e-04) (hash(x)=33410523) +1424 train 3.332408 (lr=4.1569e-04) (hash(x)=39230347) +1425 val loss 3.2654 +1425 val perplexity 26.1904 +1425 train 3.314472 (lr=4.1524e-04) (hash(x)=38302623) +1426 train 3.353229 (lr=4.1479e-04) (hash(x)=32546404) +1427 train 3.286991 (lr=4.1434e-04) (hash(x)=38178758) +1428 train 3.397202 (lr=4.1389e-04) (hash(x)=38180434) +1429 train 3.324953 (lr=4.1343e-04) (hash(x)=38579115) +1430 train 3.305095 (lr=4.1298e-04) (hash(x)=39141505) +1431 train 3.300657 (lr=4.1253e-04) (hash(x)=38759223) +1432 train 3.304950 (lr=4.1208e-04) (hash(x)=40416349) +1433 train 3.376691 (lr=4.1162e-04) (hash(x)=40665148) +1434 train 3.313803 (lr=4.1117e-04) (hash(x)=42747047) +1435 train 3.267261 (lr=4.1072e-04) (hash(x)=38994336) +1436 train 3.284484 (lr=4.1026e-04) (hash(x)=43581943) +1437 train 3.229019 (lr=4.0981e-04) (hash(x)=36109750) +1438 train 3.272534 (lr=4.0936e-04) (hash(x)=38435961) +1439 train 3.267527 (lr=4.0890e-04) (hash(x)=35390493) +1440 train 3.329157 (lr=4.0845e-04) (hash(x)=38954690) +1441 train 3.284160 (lr=4.0799e-04) (hash(x)=43563271) +1442 train 3.235402 (lr=4.0754e-04) (hash(x)=37573463) +1443 train 3.214846 (lr=4.0708e-04) (hash(x)=43225754) +1444 train 3.244333 (lr=4.0663e-04) (hash(x)=40274308) +1445 train 3.189131 (lr=4.0617e-04) (hash(x)=40593347) +1446 train 3.226950 (lr=4.0572e-04) (hash(x)=38916215) +1447 train 3.263590 (lr=4.0526e-04) (hash(x)=42053841) +1448 train 3.277019 (lr=4.0480e-04) (hash(x)=40352409) +1449 train 3.277288 (lr=4.0435e-04) (hash(x)=39607176) +1450 val loss 3.2540 +1450 val perplexity 25.8924 +1450 train 3.292847 (lr=4.0389e-04) (hash(x)=37635541) +1451 train 3.243500 (lr=4.0343e-04) (hash(x)=44540916) +1452 train 3.291124 (lr=4.0297e-04) (hash(x)=41991488) +1453 train 3.292513 (lr=4.0252e-04) (hash(x)=41481379) +1454 train 3.307668 (lr=4.0206e-04) (hash(x)=42646440) +1455 train 3.245224 (lr=4.0160e-04) (hash(x)=39574589) +1456 train 3.289577 (lr=4.0114e-04) (hash(x)=44798584) +1457 train 3.311811 (lr=4.0068e-04) (hash(x)=44520321) +1458 train 3.268231 (lr=4.0023e-04) (hash(x)=35459071) +1459 train 3.332103 (lr=3.9977e-04) (hash(x)=39527511) +1460 train 3.385240 (lr=3.9931e-04) (hash(x)=32949197) +1461 train 3.326185 (lr=3.9885e-04) (hash(x)=37194616) +1462 train 3.334765 (lr=3.9839e-04) (hash(x)=40296128) +1463 train 3.318813 (lr=3.9793e-04) (hash(x)=43129511) +1464 train 3.318205 (lr=3.9747e-04) (hash(x)=41910070) +1465 train 3.341460 (lr=3.9701e-04) (hash(x)=39165053) +1466 train 3.313695 (lr=3.9655e-04) (hash(x)=38398284) +1467 train 3.291786 (lr=3.9609e-04) (hash(x)=35935367) +1468 train 3.284599 (lr=3.9563e-04) (hash(x)=38388449) +1469 train 3.312512 (lr=3.9517e-04) (hash(x)=31138209) +1470 train 3.322227 (lr=3.9470e-04) (hash(x)=41871807) +1471 train 3.226751 (lr=3.9424e-04) (hash(x)=39368019) +1472 train 3.284444 (lr=3.9378e-04) (hash(x)=41237444) +1473 train 3.237185 (lr=3.9332e-04) (hash(x)=42991689) +1474 train 3.262642 (lr=3.9286e-04) (hash(x)=38217708) +1475 val loss 3.2534 +1475 val perplexity 25.8776 +1475 train 3.222987 (lr=3.9239e-04) (hash(x)=38114803) +1476 train 3.261957 (lr=3.9193e-04) (hash(x)=40551117) +1477 train 3.358295 (lr=3.9147e-04) (hash(x)=52744946) +1478 train 3.278604 (lr=3.9101e-04) (hash(x)=35808619) +1479 train 3.287839 (lr=3.9054e-04) (hash(x)=40311539) +1480 train 3.244472 (lr=3.9008e-04) (hash(x)=45796944) +1481 train 3.304912 (lr=3.8962e-04) (hash(x)=38215815) +1482 train 3.319643 (lr=3.8915e-04) (hash(x)=42135205) +1483 train 3.276005 (lr=3.8869e-04) (hash(x)=34109574) +1484 train 3.328987 (lr=3.8823e-04) (hash(x)=32093391) +1485 train 3.332730 (lr=3.8776e-04) (hash(x)=37332378) +1486 train 3.229790 (lr=3.8730e-04) (hash(x)=42475410) +1487 train 3.273177 (lr=3.8683e-04) (hash(x)=31804345) +1488 train 3.232828 (lr=3.8637e-04) (hash(x)=49418346) +1489 train 3.207266 (lr=3.8590e-04) (hash(x)=42965318) +1490 train 3.261632 (lr=3.8544e-04) (hash(x)=37389562) +1491 train 3.283251 (lr=3.8497e-04) (hash(x)=42288964) +1492 train 3.240224 (lr=3.8451e-04) (hash(x)=39807121) +1493 train 3.302104 (lr=3.8404e-04) (hash(x)=40313360) +1494 train 3.261197 (lr=3.8358e-04) (hash(x)=41706723) +1495 train 3.282547 (lr=3.8311e-04) (hash(x)=40829448) +1496 train 3.275269 (lr=3.8265e-04) (hash(x)=40963468) +1497 train 3.288844 (lr=3.8218e-04) (hash(x)=41394160) +1498 train 3.276536 (lr=3.8171e-04) (hash(x)=37971848) +1499 train 3.301325 (lr=3.8125e-04) (hash(x)=40504140) +1500 val loss 3.2510 +1500 val perplexity 25.8165 +1500 hella 0.2808 +1500 train 3.363853 (lr=3.8078e-04) (hash(x)=38437238) +1501 train 3.325911 (lr=3.8031e-04) (hash(x)=36779321) +1502 train 3.326355 (lr=3.7985e-04) (hash(x)=41735244) +1503 train 3.324284 (lr=3.7938e-04) (hash(x)=40214283) +1504 train 3.335333 (lr=3.7891e-04) (hash(x)=45624869) +1505 train 3.334893 (lr=3.7844e-04) (hash(x)=39644174) +1506 train 3.263528 (lr=3.7798e-04) (hash(x)=36700464) +1507 train 3.257099 (lr=3.7751e-04) (hash(x)=43603225) +1508 train 3.252246 (lr=3.7704e-04) (hash(x)=38127029) +1509 train 3.195961 (lr=3.7657e-04) (hash(x)=38141868) +1510 train 3.283391 (lr=3.7610e-04) (hash(x)=45921763) +1511 train 3.272612 (lr=3.7564e-04) (hash(x)=37979059) +1512 train 3.270656 (lr=3.7517e-04) (hash(x)=33990585) +1513 train 3.255932 (lr=3.7470e-04) (hash(x)=37242510) +1514 train 3.251043 (lr=3.7423e-04) (hash(x)=37199291) +1515 train 3.302726 (lr=3.7376e-04) (hash(x)=37602195) +1516 train 3.270227 (lr=3.7329e-04) (hash(x)=42568654) +1517 train 3.288457 (lr=3.7282e-04) (hash(x)=36878775) +1518 train 3.257869 (lr=3.7235e-04) (hash(x)=54862739) +1519 train 3.263519 (lr=3.7189e-04) (hash(x)=38539806) +1520 train 3.247023 (lr=3.7142e-04) (hash(x)=37679700) +1521 train 3.218805 (lr=3.7095e-04) (hash(x)=42360543) +1522 train 3.257734 (lr=3.7048e-04) (hash(x)=41082767) +1523 train 3.235063 (lr=3.7001e-04) (hash(x)=41961680) +1524 train 3.193478 (lr=3.6954e-04) (hash(x)=45941898) +1525 val loss 3.2456 +1525 val perplexity 25.6782 +1525 train 3.320429 (lr=3.6907e-04) (hash(x)=40745810) +1526 train 3.210381 (lr=3.6860e-04) (hash(x)=44385964) +1527 train 3.198321 (lr=3.6813e-04) (hash(x)=44101752) +1528 train 3.299877 (lr=3.6766e-04) (hash(x)=35883317) +1529 train 3.313793 (lr=3.6718e-04) (hash(x)=38282851) +1530 train 3.301355 (lr=3.6671e-04) (hash(x)=41585307) +1531 train 3.254501 (lr=3.6624e-04) (hash(x)=39010792) +1532 train 3.280310 (lr=3.6577e-04) (hash(x)=43656072) +1533 train 3.317724 (lr=3.6530e-04) (hash(x)=50035175) +1534 train 3.303927 (lr=3.6483e-04) (hash(x)=40950253) +1535 train 3.292932 (lr=3.6436e-04) (hash(x)=40806684) +1536 train 3.281129 (lr=3.6389e-04) (hash(x)=39464310) +1537 train 3.280722 (lr=3.6342e-04) (hash(x)=47629719) +1538 train 3.261075 (lr=3.6294e-04) (hash(x)=40370491) +1539 train 3.241009 (lr=3.6247e-04) (hash(x)=36751618) +1540 train 3.311562 (lr=3.6200e-04) (hash(x)=41475872) +1541 train 3.298558 (lr=3.6153e-04) (hash(x)=33338071) +1542 train 3.284684 (lr=3.6106e-04) (hash(x)=33648781) +1543 train 3.270928 (lr=3.6058e-04) (hash(x)=41832498) +1544 train 3.321207 (lr=3.6011e-04) (hash(x)=38669834) +1545 train 3.288306 (lr=3.5964e-04) (hash(x)=39270511) +1546 train 3.217741 (lr=3.5917e-04) (hash(x)=37652214) +1547 train 3.315107 (lr=3.5870e-04) (hash(x)=36231307) +1548 train 3.278179 (lr=3.5822e-04) (hash(x)=36901038) +1549 train 3.244011 (lr=3.5775e-04) (hash(x)=41482882) +1550 val loss 3.2439 +1550 val perplexity 25.6331 +1550 train 3.291362 (lr=3.5728e-04) (hash(x)=41557319) +1551 train 3.246365 (lr=3.5680e-04) (hash(x)=41474046) +1552 train 3.286222 (lr=3.5633e-04) (hash(x)=37056152) +1553 train 3.320092 (lr=3.5586e-04) (hash(x)=39959453) +1554 train 3.229634 (lr=3.5539e-04) (hash(x)=43716624) +1555 train 3.304968 (lr=3.5491e-04) (hash(x)=39217682) +1556 train 3.216599 (lr=3.5444e-04) (hash(x)=38289480) +1557 train 3.220414 (lr=3.5397e-04) (hash(x)=37990193) +1558 train 3.296796 (lr=3.5349e-04) (hash(x)=41000789) +1559 train 3.311285 (lr=3.5302e-04) (hash(x)=48376281) +1560 train 3.211907 (lr=3.5255e-04) (hash(x)=32921213) +1561 train 3.369801 (lr=3.5207e-04) (hash(x)=38895745) +1562 train 3.313920 (lr=3.5160e-04) (hash(x)=39818693) +1563 train 3.209257 (lr=3.5112e-04) (hash(x)=48181852) +1564 train 3.257323 (lr=3.5065e-04) (hash(x)=39309475) +1565 train 3.273262 (lr=3.5018e-04) (hash(x)=41385503) +1566 train 3.274280 (lr=3.4970e-04) (hash(x)=34765243) +1567 train 3.241324 (lr=3.4923e-04) (hash(x)=36375896) +1568 train 3.236854 (lr=3.4876e-04) (hash(x)=39280048) +1569 train 3.222917 (lr=3.4828e-04) (hash(x)=41802736) +1570 train 3.247226 (lr=3.4781e-04) (hash(x)=37277722) +1571 train 3.279045 (lr=3.4733e-04) (hash(x)=39908040) +1572 train 3.292723 (lr=3.4686e-04) (hash(x)=38589955) +1573 train 3.228196 (lr=3.4638e-04) (hash(x)=35086657) +1574 train 3.314123 (lr=3.4591e-04) (hash(x)=45604881) +1575 val loss 3.2391 +1575 val perplexity 25.5116 +1575 train 3.201085 (lr=3.4544e-04) (hash(x)=38510152) +1576 train 3.300543 (lr=3.4496e-04) (hash(x)=35775283) +1577 train 3.349681 (lr=3.4449e-04) (hash(x)=36416373) +1578 train 3.244648 (lr=3.4401e-04) (hash(x)=45364220) +1579 train 3.279973 (lr=3.4354e-04) (hash(x)=43335655) +1580 train 3.343429 (lr=3.4306e-04) (hash(x)=40709619) +1581 train 3.218524 (lr=3.4259e-04) (hash(x)=42606714) +1582 train 3.274136 (lr=3.4211e-04) (hash(x)=37243792) +1583 train 3.315675 (lr=3.4164e-04) (hash(x)=36351019) +1584 train 3.342993 (lr=3.4116e-04) (hash(x)=44440032) +1585 train 3.206742 (lr=3.4069e-04) (hash(x)=39961610) +1586 train 3.285097 (lr=3.4021e-04) (hash(x)=45330469) +1587 train 3.266128 (lr=3.3974e-04) (hash(x)=41485976) +1588 train 3.271896 (lr=3.3926e-04) (hash(x)=39083408) +1589 train 3.204138 (lr=3.3879e-04) (hash(x)=41128869) +1590 train 3.245745 (lr=3.3831e-04) (hash(x)=42037900) +1591 train 3.220410 (lr=3.3784e-04) (hash(x)=44436095) +1592 train 3.218613 (lr=3.3736e-04) (hash(x)=38884979) +1593 train 3.279368 (lr=3.3689e-04) (hash(x)=36553809) +1594 train 3.219196 (lr=3.3641e-04) (hash(x)=40612555) +1595 train 3.208724 (lr=3.3594e-04) (hash(x)=37326976) +1596 train 3.260921 (lr=3.3546e-04) (hash(x)=41158468) +1597 train 3.206905 (lr=3.3499e-04) (hash(x)=56912213) +1598 train 3.308151 (lr=3.3451e-04) (hash(x)=37908861) +1599 train 3.249130 (lr=3.3404e-04) (hash(x)=38022013) +1600 val loss 3.2401 +1600 val perplexity 25.5371 +1600 train 3.245176 (lr=3.3356e-04) (hash(x)=33829496) +1601 train 3.235037 (lr=3.3309e-04) (hash(x)=37185914) +1602 train 3.184836 (lr=3.3261e-04) (hash(x)=38817079) +1603 train 3.288249 (lr=3.3214e-04) (hash(x)=33242340) +1604 train 3.247543 (lr=3.3166e-04) (hash(x)=35693832) +1605 train 3.246823 (lr=3.3119e-04) (hash(x)=43559771) +1606 train 3.241871 (lr=3.3071e-04) (hash(x)=39394699) +1607 train 3.258960 (lr=3.3024e-04) (hash(x)=41509330) +1608 train 3.279260 (lr=3.2976e-04) (hash(x)=38624098) +1609 train 3.362192 (lr=3.2929e-04) (hash(x)=38706711) +1610 train 3.245588 (lr=3.2881e-04) (hash(x)=41727145) +1611 train 3.343051 (lr=3.2834e-04) (hash(x)=42452935) +1612 train 3.244937 (lr=3.2786e-04) (hash(x)=40154850) +1613 train 3.244156 (lr=3.2739e-04) (hash(x)=37455717) +1614 train 3.262235 (lr=3.2691e-04) (hash(x)=38644705) +1615 train 3.270588 (lr=3.2644e-04) (hash(x)=31903442) +1616 train 3.244617 (lr=3.2596e-04) (hash(x)=42959822) +1617 train 3.279221 (lr=3.2549e-04) (hash(x)=42824164) +1618 train 3.238466 (lr=3.2501e-04) (hash(x)=43450900) +1619 train 3.271219 (lr=3.2454e-04) (hash(x)=37444037) +1620 train 3.326133 (lr=3.2406e-04) (hash(x)=37396491) +1621 train 3.234607 (lr=3.2359e-04) (hash(x)=37369825) +1622 train 3.342620 (lr=3.2311e-04) (hash(x)=39563580) +1623 train 3.249398 (lr=3.2264e-04) (hash(x)=38796654) +1624 train 3.246705 (lr=3.2216e-04) (hash(x)=39448215) +1625 val loss 3.2366 +1625 val perplexity 25.4468 +1625 train 3.201710 (lr=3.2169e-04) (hash(x)=36582844) +1626 train 3.300834 (lr=3.2121e-04) (hash(x)=30087474) +1627 train 3.205949 (lr=3.2074e-04) (hash(x)=41779884) +1628 train 3.242489 (lr=3.2026e-04) (hash(x)=42409089) +1629 train 3.217831 (lr=3.1979e-04) (hash(x)=37002488) +1630 train 3.264272 (lr=3.1931e-04) (hash(x)=40652429) +1631 train 3.236899 (lr=3.1884e-04) (hash(x)=32432582) +1632 train 3.274159 (lr=3.1836e-04) (hash(x)=43322092) +1633 train 3.288680 (lr=3.1789e-04) (hash(x)=33593703) +1634 train 3.272465 (lr=3.1741e-04) (hash(x)=42670273) +1635 train 3.331185 (lr=3.1694e-04) (hash(x)=39806845) +1636 train 3.260592 (lr=3.1646e-04) (hash(x)=36772212) +1637 train 3.242445 (lr=3.1599e-04) (hash(x)=38951346) +1638 train 3.280698 (lr=3.1551e-04) (hash(x)=40576002) +1639 train 3.243823 (lr=3.1504e-04) (hash(x)=40449639) +1640 train 3.317309 (lr=3.1456e-04) (hash(x)=40189321) +1641 train 3.224088 (lr=3.1409e-04) (hash(x)=42829377) +1642 train 3.212140 (lr=3.1362e-04) (hash(x)=47534151) +1643 train 3.304203 (lr=3.1314e-04) (hash(x)=42333404) +1644 train 3.299316 (lr=3.1267e-04) (hash(x)=42281866) +1645 train 3.274815 (lr=3.1219e-04) (hash(x)=39005235) +1646 train 3.292387 (lr=3.1172e-04) (hash(x)=45286999) +1647 train 3.258063 (lr=3.1124e-04) (hash(x)=26004601) +1648 train 3.331745 (lr=3.1077e-04) (hash(x)=40474528) +1649 train 3.221615 (lr=3.1030e-04) (hash(x)=48719475) +1650 val loss 3.2296 +1650 val perplexity 25.2687 +1650 train 3.259109 (lr=3.0982e-04) (hash(x)=44026569) +1651 train 3.248416 (lr=3.0935e-04) (hash(x)=36454237) +1652 train 3.263535 (lr=3.0888e-04) (hash(x)=39992748) +1653 train 3.272856 (lr=3.0840e-04) (hash(x)=35636527) +1654 train 3.200178 (lr=3.0793e-04) (hash(x)=35404180) +1655 train 3.246858 (lr=3.0745e-04) (hash(x)=33832069) +1656 train 3.237771 (lr=3.0698e-04) (hash(x)=42319641) +1657 train 3.224629 (lr=3.0651e-04) (hash(x)=45652712) +1658 train 3.276791 (lr=3.0603e-04) (hash(x)=41600654) +1659 train 3.243922 (lr=3.0556e-04) (hash(x)=32927581) +1660 train 3.264238 (lr=3.0509e-04) (hash(x)=36118637) +1661 train 3.190368 (lr=3.0461e-04) (hash(x)=45184693) +1662 train 3.223465 (lr=3.0414e-04) (hash(x)=40389631) +1663 train 3.193904 (lr=3.0367e-04) (hash(x)=45560774) +1664 train 3.320172 (lr=3.0320e-04) (hash(x)=40929062) +1665 train 3.246727 (lr=3.0272e-04) (hash(x)=43411667) +1666 train 3.224555 (lr=3.0225e-04) (hash(x)=34675070) +1667 train 3.248943 (lr=3.0178e-04) (hash(x)=35481718) +1668 train 3.310820 (lr=3.0130e-04) (hash(x)=34177516) +1669 train 3.221120 (lr=3.0083e-04) (hash(x)=39107630) +1670 train 3.248811 (lr=3.0036e-04) (hash(x)=38636541) +1671 train 3.257601 (lr=2.9989e-04) (hash(x)=37606649) +1672 train 3.294472 (lr=2.9942e-04) (hash(x)=41607734) +1673 train 3.260998 (lr=2.9894e-04) (hash(x)=55090583) +1674 train 3.468100 (lr=2.9847e-04) (hash(x)=50859180) +1675 val loss 3.2332 +1675 val perplexity 25.3612 +1675 train 3.344836 (lr=2.9800e-04) (hash(x)=41804716) +1676 train 3.234068 (lr=2.9753e-04) (hash(x)=42448271) +1677 train 3.405189 (lr=2.9706e-04) (hash(x)=45277899) +1678 train 3.354347 (lr=2.9658e-04) (hash(x)=40619199) +1679 train 3.194472 (lr=2.9611e-04) (hash(x)=36934831) +1680 train 3.270220 (lr=2.9564e-04) (hash(x)=40306159) +1681 train 3.255213 (lr=2.9517e-04) (hash(x)=48311984) +1682 train 3.257687 (lr=2.9470e-04) (hash(x)=43254652) +1683 train 3.273958 (lr=2.9423e-04) (hash(x)=44552557) +1684 train 3.295833 (lr=2.9376e-04) (hash(x)=37204210) +1685 train 3.236464 (lr=2.9329e-04) (hash(x)=39905120) +1686 train 3.205500 (lr=2.9282e-04) (hash(x)=45680667) +1687 train 3.255460 (lr=2.9234e-04) (hash(x)=40288658) +1688 train 3.292935 (lr=2.9187e-04) (hash(x)=42647543) +1689 train 3.251855 (lr=2.9140e-04) (hash(x)=32757022) +1690 train 3.304486 (lr=2.9093e-04) (hash(x)=39924777) +1691 train 3.253551 (lr=2.9046e-04) (hash(x)=38815006) +1692 train 3.263701 (lr=2.8999e-04) (hash(x)=41749184) +1693 train 3.254134 (lr=2.8952e-04) (hash(x)=39643878) +1694 train 3.312846 (lr=2.8905e-04) (hash(x)=41412647) +1695 train 3.278178 (lr=2.8858e-04) (hash(x)=36309717) +1696 train 3.232444 (lr=2.8811e-04) (hash(x)=41616084) +1697 train 3.166148 (lr=2.8765e-04) (hash(x)=40804767) +1698 train 3.199450 (lr=2.8718e-04) (hash(x)=36961803) +1699 train 3.254374 (lr=2.8671e-04) (hash(x)=43500878) +1700 val loss 3.2291 +1700 val perplexity 25.2563 +1700 train 3.279798 (lr=2.8624e-04) (hash(x)=40781516) +1701 train 3.215210 (lr=2.8577e-04) (hash(x)=41619439) +1702 train 3.195870 (lr=2.8530e-04) (hash(x)=39873528) +1703 train 3.284061 (lr=2.8483e-04) (hash(x)=43492816) +1704 train 3.205495 (lr=2.8436e-04) (hash(x)=40868445) +1705 train 3.186826 (lr=2.8390e-04) (hash(x)=37380922) +1706 train 3.219397 (lr=2.8343e-04) (hash(x)=39549113) +1707 train 3.265593 (lr=2.8296e-04) (hash(x)=38369687) +1708 train 3.205846 (lr=2.8249e-04) (hash(x)=42429052) +1709 train 3.245359 (lr=2.8202e-04) (hash(x)=43578169) +1710 train 3.272828 (lr=2.8156e-04) (hash(x)=44686910) +1711 train 3.251350 (lr=2.8109e-04) (hash(x)=38043866) +1712 train 3.221106 (lr=2.8062e-04) (hash(x)=38100009) +1713 train 3.296350 (lr=2.8015e-04) (hash(x)=37868652) +1714 train 3.257079 (lr=2.7969e-04) (hash(x)=39759105) +1715 train 3.287197 (lr=2.7922e-04) (hash(x)=42151981) +1716 train 3.261547 (lr=2.7875e-04) (hash(x)=39273803) +1717 train 3.304644 (lr=2.7829e-04) (hash(x)=34622458) +1718 train 3.296021 (lr=2.7782e-04) (hash(x)=42321027) +1719 train 3.158977 (lr=2.7735e-04) (hash(x)=41680118) +1720 train 3.225459 (lr=2.7689e-04) (hash(x)=39405712) +1721 train 3.281402 (lr=2.7642e-04) (hash(x)=41681095) +1722 train 3.248887 (lr=2.7596e-04) (hash(x)=36043266) +1723 train 3.245803 (lr=2.7549e-04) (hash(x)=43014900) +1724 train 3.298281 (lr=2.7503e-04) (hash(x)=40348318) +1725 val loss 3.2225 +1725 val perplexity 25.0899 +1725 train 3.292219 (lr=2.7456e-04) (hash(x)=38895974) +1726 train 3.272167 (lr=2.7410e-04) (hash(x)=37137066) +1727 train 3.288555 (lr=2.7363e-04) (hash(x)=38770970) +1728 train 3.255865 (lr=2.7317e-04) (hash(x)=38293287) +1729 train 3.239870 (lr=2.7270e-04) (hash(x)=41389085) +1730 train 3.269382 (lr=2.7224e-04) (hash(x)=44153301) +1731 train 3.285167 (lr=2.7177e-04) (hash(x)=38603796) +1732 train 3.184755 (lr=2.7131e-04) (hash(x)=41618930) +1733 train 3.257094 (lr=2.7085e-04) (hash(x)=39420921) +1734 train 3.271162 (lr=2.7038e-04) (hash(x)=42442829) +1735 train 3.206495 (lr=2.6992e-04) (hash(x)=47354161) +1736 train 3.241241 (lr=2.6946e-04) (hash(x)=38452655) +1737 train 3.237236 (lr=2.6899e-04) (hash(x)=40384920) +1738 train 3.170589 (lr=2.6853e-04) (hash(x)=38868555) +1739 train 3.281293 (lr=2.6807e-04) (hash(x)=42552345) +1740 train 3.274852 (lr=2.6761e-04) (hash(x)=32415631) +1741 train 3.153691 (lr=2.6714e-04) (hash(x)=42465685) +1742 train 3.218582 (lr=2.6668e-04) (hash(x)=37492090) +1743 train 3.221865 (lr=2.6622e-04) (hash(x)=43243129) +1744 train 3.233768 (lr=2.6576e-04) (hash(x)=36160899) +1745 train 3.273994 (lr=2.6530e-04) (hash(x)=35230723) +1746 train 3.192858 (lr=2.6483e-04) (hash(x)=36098109) +1747 train 3.211461 (lr=2.6437e-04) (hash(x)=39140567) +1748 train 3.265207 (lr=2.6391e-04) (hash(x)=36853859) +1749 train 3.244279 (lr=2.6345e-04) (hash(x)=40983988) +1750 val loss 3.2210 +1750 val perplexity 25.0544 +1750 hella 0.2821 +1750 train 3.246015 (lr=2.6299e-04) (hash(x)=35524701) +1751 train 3.286753 (lr=2.6253e-04) (hash(x)=44082117) +1752 train 3.271877 (lr=2.6207e-04) (hash(x)=40325612) +1753 train 3.354148 (lr=2.6161e-04) (hash(x)=40052964) +1754 train 3.312106 (lr=2.6115e-04) (hash(x)=40311202) +1755 train 3.282332 (lr=2.6069e-04) (hash(x)=42038695) +1756 train 3.220282 (lr=2.6023e-04) (hash(x)=40995491) +1757 train 3.268796 (lr=2.5977e-04) (hash(x)=44242585) +1758 train 3.276194 (lr=2.5932e-04) (hash(x)=42642242) +1759 train 3.288083 (lr=2.5886e-04) (hash(x)=43702114) +1760 train 3.264890 (lr=2.5840e-04) (hash(x)=36490688) +1761 train 3.276682 (lr=2.5794e-04) (hash(x)=41920961) +1762 train 3.273992 (lr=2.5748e-04) (hash(x)=44048262) +1763 train 3.303403 (lr=2.5703e-04) (hash(x)=36995202) +1764 train 3.217310 (lr=2.5657e-04) (hash(x)=41158267) +1765 train 3.218967 (lr=2.5611e-04) (hash(x)=43844858) +1766 train 3.269735 (lr=2.5565e-04) (hash(x)=39451655) +1767 train 3.316052 (lr=2.5520e-04) (hash(x)=41001514) +1768 train 3.262410 (lr=2.5474e-04) (hash(x)=37800166) +1769 train 3.195050 (lr=2.5428e-04) (hash(x)=35307895) +1770 train 3.236211 (lr=2.5383e-04) (hash(x)=38281275) +1771 train 3.333802 (lr=2.5337e-04) (hash(x)=32674945) +1772 train 3.217360 (lr=2.5292e-04) (hash(x)=36258225) +1773 train 3.249336 (lr=2.5246e-04) (hash(x)=38289568) +1774 train 3.252531 (lr=2.5201e-04) (hash(x)=44607425) +1775 val loss 3.2174 +1775 val perplexity 24.9637 +1775 train 3.174542 (lr=2.5155e-04) (hash(x)=46626508) +1776 train 3.260229 (lr=2.5110e-04) (hash(x)=44275246) +1777 train 3.184038 (lr=2.5064e-04) (hash(x)=38647259) +1778 train 3.200795 (lr=2.5019e-04) (hash(x)=41453360) +1779 train 3.243863 (lr=2.4974e-04) (hash(x)=42583385) +1780 train 3.192542 (lr=2.4928e-04) (hash(x)=36312646) +1781 train 3.233576 (lr=2.4883e-04) (hash(x)=42975378) +1782 train 3.267978 (lr=2.4838e-04) (hash(x)=36797403) +1783 train 3.279062 (lr=2.4792e-04) (hash(x)=36974561) +1784 train 3.221891 (lr=2.4747e-04) (hash(x)=38831856) +1785 train 3.237763 (lr=2.4702e-04) (hash(x)=47339990) +1786 train 3.224107 (lr=2.4657e-04) (hash(x)=39603929) +1787 train 3.227729 (lr=2.4611e-04) (hash(x)=43278203) +1788 train 3.218491 (lr=2.4566e-04) (hash(x)=38723817) +1789 train 3.220418 (lr=2.4521e-04) (hash(x)=34155227) +1790 train 3.250545 (lr=2.4476e-04) (hash(x)=38472940) +1791 train 3.230571 (lr=2.4431e-04) (hash(x)=40729061) +1792 train 3.250022 (lr=2.4386e-04) (hash(x)=38509923) +1793 train 3.231724 (lr=2.4341e-04) (hash(x)=39985846) +1794 train 3.179636 (lr=2.4296e-04) (hash(x)=35047735) +1795 train 3.282080 (lr=2.4251e-04) (hash(x)=40488790) +1796 train 3.231949 (lr=2.4206e-04) (hash(x)=39602899) +1797 train 3.235473 (lr=2.4161e-04) (hash(x)=40197576) +1798 train 3.253954 (lr=2.4116e-04) (hash(x)=40856357) +1799 train 3.278501 (lr=2.4071e-04) (hash(x)=39957542) +1800 val loss 3.2134 +1800 val perplexity 24.8640 +1800 train 3.252983 (lr=2.4026e-04) (hash(x)=38583196) +1801 train 3.290623 (lr=2.3982e-04) (hash(x)=39373095) +1802 train 3.290672 (lr=2.3937e-04) (hash(x)=38874817) +1803 train 3.214489 (lr=2.3892e-04) (hash(x)=42238098) +1804 train 3.229688 (lr=2.3847e-04) (hash(x)=39524613) +1805 train 3.261172 (lr=2.3803e-04) (hash(x)=33472701) +1806 train 3.223542 (lr=2.3758e-04) (hash(x)=37746329) +1807 train 3.207047 (lr=2.3713e-04) (hash(x)=38029517) +1808 train 3.261840 (lr=2.3669e-04) (hash(x)=40741670) +1809 train 3.203547 (lr=2.3624e-04) (hash(x)=42397049) +1810 train 3.198976 (lr=2.3580e-04) (hash(x)=41011013) +1811 train 3.244263 (lr=2.3535e-04) (hash(x)=34476572) +1812 train 3.231594 (lr=2.3491e-04) (hash(x)=43120148) +1813 train 3.202306 (lr=2.3446e-04) (hash(x)=37985253) +1814 train 3.250341 (lr=2.3402e-04) (hash(x)=44040974) +1815 train 3.172713 (lr=2.3357e-04) (hash(x)=37513379) +1816 train 3.197300 (lr=2.3313e-04) (hash(x)=38836355) +1817 train 3.206135 (lr=2.3269e-04) (hash(x)=31824634) +1818 train 3.254334 (lr=2.3224e-04) (hash(x)=41528556) +1819 train 3.290797 (lr=2.3180e-04) (hash(x)=36254437) +1820 train 3.270416 (lr=2.3136e-04) (hash(x)=36928765) +1821 train 3.212972 (lr=2.3092e-04) (hash(x)=39807164) +1822 train 3.241275 (lr=2.3047e-04) (hash(x)=39759717) +1823 train 3.141451 (lr=2.3003e-04) (hash(x)=39225987) +1824 train 3.205263 (lr=2.2959e-04) (hash(x)=42296575) +1825 val loss 3.2097 +1825 val perplexity 24.7709 +1825 train 3.181390 (lr=2.2915e-04) (hash(x)=37985027) +1826 train 3.252151 (lr=2.2871e-04) (hash(x)=38654248) +1827 train 3.121562 (lr=2.2827e-04) (hash(x)=34974492) +1828 train 3.226080 (lr=2.2783e-04) (hash(x)=35772664) +1829 train 3.228004 (lr=2.2739e-04) (hash(x)=34555551) +1830 train 3.153117 (lr=2.2695e-04) (hash(x)=40229913) +1831 train 3.182893 (lr=2.2651e-04) (hash(x)=35861584) +1832 train 3.197702 (lr=2.2607e-04) (hash(x)=39536353) +1833 train 3.230463 (lr=2.2563e-04) (hash(x)=42091346) +1834 train 3.234297 (lr=2.2520e-04) (hash(x)=38472944) +1835 train 3.239589 (lr=2.2476e-04) (hash(x)=43872622) +1836 train 3.245009 (lr=2.2432e-04) (hash(x)=42242242) +1837 train 3.220756 (lr=2.2388e-04) (hash(x)=39853898) +1838 train 3.210279 (lr=2.2345e-04) (hash(x)=39377932) +1839 train 3.228456 (lr=2.2301e-04) (hash(x)=35654146) +1840 train 3.297413 (lr=2.2257e-04) (hash(x)=45179539) +1841 train 3.245961 (lr=2.2214e-04) (hash(x)=37773645) +1842 train 3.235965 (lr=2.2170e-04) (hash(x)=33911115) +1843 train 3.307305 (lr=2.2127e-04) (hash(x)=46110624) +1844 train 3.288793 (lr=2.2083e-04) (hash(x)=38908139) +1845 train 3.239395 (lr=2.2040e-04) (hash(x)=33973175) +1846 train 3.257918 (lr=2.1996e-04) (hash(x)=38302612) +1847 train 3.202480 (lr=2.1953e-04) (hash(x)=36436634) +1848 train 3.286590 (lr=2.1910e-04) (hash(x)=48358906) +1849 train 3.214869 (lr=2.1866e-04) (hash(x)=36116003) +1850 val loss 3.2092 +1850 val perplexity 24.7589 +1850 train 3.189213 (lr=2.1823e-04) (hash(x)=39425759) +1851 train 3.273628 (lr=2.1780e-04) (hash(x)=39043755) +1852 train 3.229943 (lr=2.1737e-04) (hash(x)=39043160) +1853 train 3.199236 (lr=2.1693e-04) (hash(x)=34777699) +1854 train 3.212109 (lr=2.1650e-04) (hash(x)=41703133) +1855 train 3.221383 (lr=2.1607e-04) (hash(x)=41244835) +1856 train 3.196274 (lr=2.1564e-04) (hash(x)=40143237) +1857 train 3.245989 (lr=2.1521e-04) (hash(x)=39529987) +1858 train 3.161592 (lr=2.1478e-04) (hash(x)=40583463) +1859 train 3.169218 (lr=2.1435e-04) (hash(x)=41784763) +1860 train 3.192044 (lr=2.1392e-04) (hash(x)=43587657) +1861 train 3.198513 (lr=2.1349e-04) (hash(x)=38820023) +1862 train 3.274941 (lr=2.1307e-04) (hash(x)=44516678) +1863 train 3.147079 (lr=2.1264e-04) (hash(x)=41862598) +1864 train 3.227850 (lr=2.1221e-04) (hash(x)=42100212) +1865 train 3.172650 (lr=2.1178e-04) (hash(x)=38022721) +1866 train 3.308240 (lr=2.1136e-04) (hash(x)=45254479) +1867 train 3.180629 (lr=2.1093e-04) (hash(x)=38264559) +1868 train 3.232266 (lr=2.1050e-04) (hash(x)=33883031) +1869 train 3.204190 (lr=2.1008e-04) (hash(x)=51791533) +1870 train 3.219502 (lr=2.0965e-04) (hash(x)=43669267) +1871 train 3.202670 (lr=2.0923e-04) (hash(x)=35253716) +1872 train 3.264106 (lr=2.0880e-04) (hash(x)=39148672) +1873 train 3.234597 (lr=2.0838e-04) (hash(x)=37991643) +1874 train 3.317046 (lr=2.0795e-04) (hash(x)=37119027) +1875 val loss 3.2035 +1875 val perplexity 24.6185 +1875 train 3.239594 (lr=2.0753e-04) (hash(x)=41326216) +1876 train 3.239051 (lr=2.0711e-04) (hash(x)=39854220) +1877 train 3.217125 (lr=2.0668e-04) (hash(x)=41991136) +1878 train 3.265463 (lr=2.0626e-04) (hash(x)=36037199) +1879 train 3.208701 (lr=2.0584e-04) (hash(x)=36706310) +1880 train 3.214015 (lr=2.0542e-04) (hash(x)=40161570) +1881 train 3.248534 (lr=2.0499e-04) (hash(x)=42034992) +1882 train 3.230705 (lr=2.0457e-04) (hash(x)=39694307) +1883 train 3.269697 (lr=2.0415e-04) (hash(x)=51318633) +1884 train 3.203427 (lr=2.0373e-04) (hash(x)=43914810) +1885 train 3.174237 (lr=2.0331e-04) (hash(x)=47910571) +1886 train 3.173986 (lr=2.0289e-04) (hash(x)=38378705) +1887 train 3.222652 (lr=2.0247e-04) (hash(x)=34411132) +1888 train 3.214168 (lr=2.0206e-04) (hash(x)=39626067) +1889 train 3.226400 (lr=2.0164e-04) (hash(x)=39601420) +1890 train 3.241733 (lr=2.0122e-04) (hash(x)=38445224) +1891 train 3.165795 (lr=2.0080e-04) (hash(x)=39879155) +1892 train 3.168354 (lr=2.0038e-04) (hash(x)=37319131) +1893 train 3.254172 (lr=1.9997e-04) (hash(x)=34303403) +1894 train 3.240737 (lr=1.9955e-04) (hash(x)=40040013) +1895 train 3.168389 (lr=1.9914e-04) (hash(x)=38657107) +1896 train 3.204543 (lr=1.9872e-04) (hash(x)=37318657) +1897 train 3.186850 (lr=1.9831e-04) (hash(x)=38363594) +1898 train 3.231563 (lr=1.9789e-04) (hash(x)=39803775) +1899 train 3.205999 (lr=1.9748e-04) (hash(x)=37776267) +1900 val loss 3.2002 +1900 val perplexity 24.5365 +1900 train 3.264389 (lr=1.9706e-04) (hash(x)=40745086) +1901 train 3.225794 (lr=1.9665e-04) (hash(x)=41579754) +1902 train 3.233960 (lr=1.9624e-04) (hash(x)=43711725) +1903 train 3.209531 (lr=1.9582e-04) (hash(x)=62352416) +1904 train 3.221849 (lr=1.9541e-04) (hash(x)=40340295) +1905 train 3.190908 (lr=1.9500e-04) (hash(x)=42373720) +1906 train 3.224402 (lr=1.9459e-04) (hash(x)=41797502) +1907 train 3.177154 (lr=1.9418e-04) (hash(x)=38466306) +1908 train 3.274211 (lr=1.9377e-04) (hash(x)=40876142) +1909 train 3.254783 (lr=1.9336e-04) (hash(x)=42449998) +1910 train 3.261122 (lr=1.9295e-04) (hash(x)=37469065) +1911 train 3.382546 (lr=1.9254e-04) (hash(x)=37519721) +1912 train 3.270185 (lr=1.9213e-04) (hash(x)=42852068) +1913 train 3.323944 (lr=1.9172e-04) (hash(x)=42649536) +1914 train 3.271092 (lr=1.9131e-04) (hash(x)=38977108) +1915 train 3.286382 (lr=1.9091e-04) (hash(x)=40671446) +1916 train 3.238861 (lr=1.9050e-04) (hash(x)=40624763) +1917 train 3.215987 (lr=1.9009e-04) (hash(x)=36612581) +1918 train 3.196985 (lr=1.8969e-04) (hash(x)=41975117) +1919 train 3.212104 (lr=1.8928e-04) (hash(x)=38070401) +1920 train 3.249581 (lr=1.8887e-04) (hash(x)=36383399) +1921 train 3.228707 (lr=1.8847e-04) (hash(x)=37339967) +1922 train 3.271787 (lr=1.8807e-04) (hash(x)=40022455) +1923 train 3.221542 (lr=1.8766e-04) (hash(x)=44200932) +1924 train 3.195146 (lr=1.8726e-04) (hash(x)=38713515) +1925 val loss 3.1994 +1925 val perplexity 24.5188 +1925 train 3.145016 (lr=1.8685e-04) (hash(x)=41063198) +1926 train 3.185942 (lr=1.8645e-04) (hash(x)=38678388) +1927 train 3.212201 (lr=1.8605e-04) (hash(x)=41482231) +1928 train 3.160076 (lr=1.8565e-04) (hash(x)=36427402) +1929 train 3.202048 (lr=1.8525e-04) (hash(x)=34968726) +1930 train 3.151781 (lr=1.8485e-04) (hash(x)=44726703) +1931 train 3.240967 (lr=1.8445e-04) (hash(x)=47879253) +1932 train 3.175279 (lr=1.8405e-04) (hash(x)=40711990) +1933 train 3.279497 (lr=1.8365e-04) (hash(x)=39311079) +1934 train 3.204220 (lr=1.8325e-04) (hash(x)=36459944) +1935 train 3.234447 (lr=1.8285e-04) (hash(x)=41197842) +1936 train 3.283351 (lr=1.8245e-04) (hash(x)=40707274) +1937 train 3.193746 (lr=1.8205e-04) (hash(x)=47145492) +1938 train 3.213556 (lr=1.8165e-04) (hash(x)=44838248) +1939 train 3.277774 (lr=1.8126e-04) (hash(x)=45484104) +1940 train 3.209962 (lr=1.8086e-04) (hash(x)=42386311) +1941 train 3.222975 (lr=1.8047e-04) (hash(x)=40383139) +1942 train 3.211974 (lr=1.8007e-04) (hash(x)=39352126) +1943 train 3.172028 (lr=1.7968e-04) (hash(x)=40822576) +1944 train 3.239057 (lr=1.7928e-04) (hash(x)=36346100) +1945 train 3.182785 (lr=1.7889e-04) (hash(x)=43538952) +1946 train 3.296746 (lr=1.7849e-04) (hash(x)=35546325) +1947 train 3.243500 (lr=1.7810e-04) (hash(x)=39383956) +1948 train 3.231143 (lr=1.7771e-04) (hash(x)=40325433) +1949 train 3.252161 (lr=1.7732e-04) (hash(x)=32774161) +1950 val loss 3.1955 +1950 val perplexity 24.4230 +1950 train 3.241665 (lr=1.7692e-04) (hash(x)=39278923) +1951 train 3.213823 (lr=1.7653e-04) (hash(x)=41395758) +1952 train 3.282988 (lr=1.7614e-04) (hash(x)=37147728) +1953 train 3.246962 (lr=1.7575e-04) (hash(x)=42987332) +1954 train 3.177680 (lr=1.7536e-04) (hash(x)=40006196) +1955 train 3.201205 (lr=1.7497e-04) (hash(x)=36782902) +1956 train 3.234619 (lr=1.7458e-04) (hash(x)=39212041) +1957 train 3.251037 (lr=1.7420e-04) (hash(x)=39234915) +1958 train 3.199675 (lr=1.7381e-04) (hash(x)=41502665) +1959 train 3.226540 (lr=1.7342e-04) (hash(x)=38241684) +1960 train 3.182420 (lr=1.7303e-04) (hash(x)=38451469) +1961 train 3.206050 (lr=1.7265e-04) (hash(x)=42052249) +1962 train 3.166573 (lr=1.7226e-04) (hash(x)=40124702) +1963 train 3.168465 (lr=1.7188e-04) (hash(x)=36476310) +1964 train 3.189315 (lr=1.7149e-04) (hash(x)=43841129) +1965 train 3.183025 (lr=1.7111e-04) (hash(x)=38754223) +1966 train 3.223260 (lr=1.7072e-04) (hash(x)=37875792) +1967 train 3.215266 (lr=1.7034e-04) (hash(x)=31093128) +1968 train 3.136075 (lr=1.6996e-04) (hash(x)=44102074) +1969 train 3.162869 (lr=1.6957e-04) (hash(x)=37806170) +1970 train 3.215866 (lr=1.6919e-04) (hash(x)=34817054) +1971 train 3.254388 (lr=1.6881e-04) (hash(x)=36103193) +1972 train 3.274875 (lr=1.6843e-04) (hash(x)=42313249) +1973 train 3.240678 (lr=1.6805e-04) (hash(x)=42586398) +1974 train 3.147765 (lr=1.6767e-04) (hash(x)=32107049) +1975 val loss 3.1932 +1975 val perplexity 24.3666 +1975 train 3.205764 (lr=1.6729e-04) (hash(x)=41638887) +1976 train 3.143480 (lr=1.6691e-04) (hash(x)=41275749) +1977 train 3.268363 (lr=1.6653e-04) (hash(x)=40327176) +1978 train 3.132615 (lr=1.6615e-04) (hash(x)=41294622) +1979 train 3.184149 (lr=1.6578e-04) (hash(x)=38125940) +1980 train 3.224453 (lr=1.6540e-04) (hash(x)=43669684) +1981 train 3.268689 (lr=1.6502e-04) (hash(x)=38192507) +1982 train 3.273597 (lr=1.6465e-04) (hash(x)=39282466) +1983 train 3.312757 (lr=1.6427e-04) (hash(x)=40664429) +1984 train 3.197439 (lr=1.6390e-04) (hash(x)=40858725) +1985 train 3.222574 (lr=1.6352e-04) (hash(x)=41472331) +1986 train 3.294549 (lr=1.6315e-04) (hash(x)=37847115) +1987 train 3.223296 (lr=1.6277e-04) (hash(x)=38027535) +1988 train 3.224029 (lr=1.6240e-04) (hash(x)=36579844) +1989 train 3.209898 (lr=1.6203e-04) (hash(x)=33109563) +1990 train 3.286825 (lr=1.6166e-04) (hash(x)=37300169) +1991 train 3.252459 (lr=1.6129e-04) (hash(x)=41056681) +1992 train 3.225785 (lr=1.6092e-04) (hash(x)=38755469) +1993 train 3.218891 (lr=1.6055e-04) (hash(x)=37288866) +1994 train 3.234530 (lr=1.6018e-04) (hash(x)=39367307) +1995 train 3.280242 (lr=1.5981e-04) (hash(x)=42781180) +1996 train 3.291843 (lr=1.5944e-04) (hash(x)=38374888) +1997 train 3.270628 (lr=1.5907e-04) (hash(x)=36511864) +1998 train 3.240833 (lr=1.5870e-04) (hash(x)=35179159) +1999 train 3.174346 (lr=1.5834e-04) (hash(x)=38117453) +2000 val loss 3.1891 +2000 val perplexity 24.2663 +2000 hella 0.2922 +2000 train 3.222191 (lr=1.5797e-04) (hash(x)=56707943) +2001 train 3.219169 (lr=1.5760e-04) (hash(x)=44301613) +2002 train 3.202171 (lr=1.5724e-04) (hash(x)=38242023) +2003 train 3.179437 (lr=1.5687e-04) (hash(x)=42642635) +2004 train 3.267187 (lr=1.5651e-04) (hash(x)=39913397) +2005 train 3.139140 (lr=1.5614e-04) (hash(x)=40378503) +2006 train 3.208698 (lr=1.5578e-04) (hash(x)=33648095) +2007 train 3.208868 (lr=1.5542e-04) (hash(x)=39054195) +2008 train 3.233824 (lr=1.5506e-04) (hash(x)=37751564) +2009 train 3.174890 (lr=1.5469e-04) (hash(x)=53792326) +2010 train 3.201140 (lr=1.5433e-04) (hash(x)=41344408) +2011 train 3.200078 (lr=1.5397e-04) (hash(x)=37943051) +2012 train 3.190244 (lr=1.5361e-04) (hash(x)=51214508) +2013 train 3.203146 (lr=1.5325e-04) (hash(x)=41798429) +2014 train 3.189331 (lr=1.5289e-04) (hash(x)=42796699) +2015 train 3.235545 (lr=1.5254e-04) (hash(x)=35321138) +2016 train 3.275719 (lr=1.5218e-04) (hash(x)=40488653) +2017 train 3.251620 (lr=1.5182e-04) (hash(x)=45676195) +2018 train 3.187697 (lr=1.5146e-04) (hash(x)=44989178) +2019 train 3.157319 (lr=1.5111e-04) (hash(x)=48323507) +2020 train 3.171504 (lr=1.5075e-04) (hash(x)=38157824) +2021 train 3.300977 (lr=1.5040e-04) (hash(x)=43330854) +2022 train 3.194975 (lr=1.5004e-04) (hash(x)=34851965) +2023 train 3.234914 (lr=1.4969e-04) (hash(x)=36575731) +2024 train 3.316779 (lr=1.4933e-04) (hash(x)=35421942) +2025 val loss 3.1869 +2025 val perplexity 24.2133 +2025 train 3.273551 (lr=1.4898e-04) (hash(x)=41999425) +2026 train 3.233250 (lr=1.4863e-04) (hash(x)=35860217) +2027 train 3.172820 (lr=1.4828e-04) (hash(x)=42528401) +2028 train 3.211511 (lr=1.4793e-04) (hash(x)=41091574) +2029 train 3.253445 (lr=1.4758e-04) (hash(x)=37256546) +2030 train 3.279229 (lr=1.4723e-04) (hash(x)=41212406) +2031 train 3.233808 (lr=1.4688e-04) (hash(x)=36826074) +2032 train 3.270710 (lr=1.4653e-04) (hash(x)=44498338) +2033 train 3.272779 (lr=1.4618e-04) (hash(x)=41055576) +2034 train 3.225005 (lr=1.4583e-04) (hash(x)=42002770) +2035 train 3.206840 (lr=1.4548e-04) (hash(x)=39497225) +2036 train 3.183893 (lr=1.4514e-04) (hash(x)=37688576) +2037 train 3.206529 (lr=1.4479e-04) (hash(x)=41782547) +2038 train 3.198198 (lr=1.4445e-04) (hash(x)=40767783) +2039 train 3.175855 (lr=1.4410e-04) (hash(x)=33968013) +2040 train 3.188486 (lr=1.4376e-04) (hash(x)=40611535) +2041 train 3.194689 (lr=1.4341e-04) (hash(x)=42473918) +2042 train 3.244920 (lr=1.4307e-04) (hash(x)=43515427) +2043 train 3.189587 (lr=1.4273e-04) (hash(x)=45518785) +2044 train 3.185007 (lr=1.4239e-04) (hash(x)=48218335) +2045 train 3.208585 (lr=1.4204e-04) (hash(x)=35671746) +2046 train 3.171389 (lr=1.4170e-04) (hash(x)=39638937) +2047 train 3.191227 (lr=1.4136e-04) (hash(x)=42198603) +2048 train 3.173256 (lr=1.4102e-04) (hash(x)=45724980) +2049 train 3.242420 (lr=1.4068e-04) (hash(x)=42263113) +2050 val loss 3.1868 +2050 val perplexity 24.2103 +2050 train 3.234306 (lr=1.4035e-04) (hash(x)=42104484) +2051 train 3.215526 (lr=1.4001e-04) (hash(x)=42229444) +2052 train 3.212276 (lr=1.3967e-04) (hash(x)=36239903) +2053 train 3.213213 (lr=1.3933e-04) (hash(x)=42763715) +2054 train 3.228881 (lr=1.3900e-04) (hash(x)=33808762) +2055 train 3.172179 (lr=1.3866e-04) (hash(x)=37785783) +2056 train 3.188059 (lr=1.3833e-04) (hash(x)=39274589) +2057 train 3.230011 (lr=1.3799e-04) (hash(x)=41367976) +2058 train 3.206701 (lr=1.3766e-04) (hash(x)=37422228) +2059 train 3.191833 (lr=1.3733e-04) (hash(x)=49976931) +2060 train 3.249191 (lr=1.3699e-04) (hash(x)=42083354) +2061 train 3.342964 (lr=1.3666e-04) (hash(x)=37573186) +2062 train 3.268910 (lr=1.3633e-04) (hash(x)=37524849) +2063 train 3.353073 (lr=1.3600e-04) (hash(x)=30872569) +2064 train 3.214433 (lr=1.3567e-04) (hash(x)=32410222) +2065 train 3.234764 (lr=1.3534e-04) (hash(x)=42107359) +2066 train 3.206204 (lr=1.3501e-04) (hash(x)=39880022) +2067 train 3.206251 (lr=1.3468e-04) (hash(x)=39953179) +2068 train 3.223487 (lr=1.3435e-04) (hash(x)=33601035) +2069 train 3.249161 (lr=1.3403e-04) (hash(x)=46413652) +2070 train 3.270621 (lr=1.3370e-04) (hash(x)=42357168) +2071 train 3.252203 (lr=1.3337e-04) (hash(x)=41716589) +2072 train 3.224942 (lr=1.3305e-04) (hash(x)=42298602) +2073 train 3.208803 (lr=1.3272e-04) (hash(x)=38659578) +2074 train 3.128889 (lr=1.3240e-04) (hash(x)=41165235) +2075 val loss 3.1841 +2075 val perplexity 24.1467 +2075 train 3.177361 (lr=1.3208e-04) (hash(x)=37372216) +2076 train 3.201893 (lr=1.3175e-04) (hash(x)=36306660) +2077 train 3.163636 (lr=1.3143e-04) (hash(x)=45823400) +2078 train 3.235507 (lr=1.3111e-04) (hash(x)=34639008) +2079 train 3.197582 (lr=1.3079e-04) (hash(x)=37572560) +2080 train 3.223686 (lr=1.3047e-04) (hash(x)=38363212) +2081 train 3.201016 (lr=1.3015e-04) (hash(x)=36687297) +2082 train 3.237901 (lr=1.2983e-04) (hash(x)=40789881) +2083 train 3.176155 (lr=1.2951e-04) (hash(x)=36223347) +2084 train 3.255848 (lr=1.2919e-04) (hash(x)=38503995) +2085 train 3.175615 (lr=1.2887e-04) (hash(x)=41601267) +2086 train 3.140862 (lr=1.2856e-04) (hash(x)=47210040) +2087 train 3.174895 (lr=1.2824e-04) (hash(x)=37664200) +2088 train 3.194806 (lr=1.2793e-04) (hash(x)=38694549) +2089 train 3.160042 (lr=1.2761e-04) (hash(x)=42828395) +2090 train 3.160867 (lr=1.2730e-04) (hash(x)=39138645) +2091 train 3.219427 (lr=1.2698e-04) (hash(x)=41811722) +2092 train 3.173548 (lr=1.2667e-04) (hash(x)=43183242) +2093 train 3.250135 (lr=1.2636e-04) (hash(x)=40259485) +2094 train 3.272863 (lr=1.2605e-04) (hash(x)=35380905) +2095 train 3.218509 (lr=1.2574e-04) (hash(x)=38930488) +2096 train 3.198859 (lr=1.2543e-04) (hash(x)=38366106) +2097 train 3.189930 (lr=1.2512e-04) (hash(x)=37892754) +2098 train 3.224765 (lr=1.2481e-04) (hash(x)=31422378) +2099 train 3.254600 (lr=1.2450e-04) (hash(x)=40519642) +2100 val loss 3.1796 +2100 val perplexity 24.0367 +2100 train 3.257238 (lr=1.2419e-04) (hash(x)=35457917) +2101 train 3.173871 (lr=1.2388e-04) (hash(x)=40280995) +2102 train 3.236063 (lr=1.2358e-04) (hash(x)=35826732) +2103 train 3.171950 (lr=1.2327e-04) (hash(x)=39143515) +2104 train 3.235286 (lr=1.2296e-04) (hash(x)=39554058) +2105 train 3.241625 (lr=1.2266e-04) (hash(x)=36339775) +2106 train 3.220742 (lr=1.2236e-04) (hash(x)=41530741) +2107 train 3.157305 (lr=1.2205e-04) (hash(x)=41060610) +2108 train 3.189696 (lr=1.2175e-04) (hash(x)=35755130) +2109 train 3.200193 (lr=1.2145e-04) (hash(x)=37626954) +2110 train 3.226523 (lr=1.2115e-04) (hash(x)=36028403) +2111 train 3.226969 (lr=1.2085e-04) (hash(x)=39856027) +2112 train 3.206479 (lr=1.2054e-04) (hash(x)=35083895) +2113 train 3.173445 (lr=1.2025e-04) (hash(x)=39270682) +2114 train 3.150347 (lr=1.1995e-04) (hash(x)=35323792) +2115 train 3.124321 (lr=1.1965e-04) (hash(x)=42573441) +2116 train 3.169347 (lr=1.1935e-04) (hash(x)=44052568) +2117 train 3.254465 (lr=1.1905e-04) (hash(x)=41432184) +2118 train 3.185150 (lr=1.1876e-04) (hash(x)=40774638) +2119 train 3.145009 (lr=1.1846e-04) (hash(x)=42170719) +2120 train 3.254835 (lr=1.1817e-04) (hash(x)=40739323) +2121 train 3.192242 (lr=1.1787e-04) (hash(x)=37669142) +2122 train 3.212479 (lr=1.1758e-04) (hash(x)=41597305) +2123 train 3.253601 (lr=1.1729e-04) (hash(x)=42549178) +2124 train 3.246919 (lr=1.1699e-04) (hash(x)=38700084) +2125 val loss 3.1790 +2125 val perplexity 24.0223 +2125 train 3.189884 (lr=1.1670e-04) (hash(x)=39893669) +2126 train 3.212507 (lr=1.1641e-04) (hash(x)=39578705) +2127 train 3.254087 (lr=1.1612e-04) (hash(x)=40870473) +2128 train 3.263184 (lr=1.1583e-04) (hash(x)=37775755) +2129 train 3.220930 (lr=1.1554e-04) (hash(x)=40860132) +2130 train 3.162859 (lr=1.1525e-04) (hash(x)=38862882) +2131 train 3.217631 (lr=1.1497e-04) (hash(x)=39012135) +2132 train 3.216703 (lr=1.1468e-04) (hash(x)=41727293) +2133 train 3.260168 (lr=1.1439e-04) (hash(x)=35997828) +2134 train 3.244363 (lr=1.1411e-04) (hash(x)=33411584) +2135 train 3.250727 (lr=1.1382e-04) (hash(x)=38013589) +2136 train 3.216146 (lr=1.1354e-04) (hash(x)=46040931) +2137 train 3.155060 (lr=1.1325e-04) (hash(x)=40096298) +2138 train 3.193447 (lr=1.1297e-04) (hash(x)=43113521) +2139 train 3.181904 (lr=1.1269e-04) (hash(x)=46434077) +2140 train 3.228526 (lr=1.1241e-04) (hash(x)=42657723) +2141 train 3.254064 (lr=1.1213e-04) (hash(x)=33455307) +2142 train 3.194732 (lr=1.1185e-04) (hash(x)=41801355) +2143 train 3.191528 (lr=1.1157e-04) (hash(x)=40188034) +2144 train 3.217355 (lr=1.1129e-04) (hash(x)=40572241) +2145 train 3.227738 (lr=1.1101e-04) (hash(x)=49081366) +2146 train 3.139304 (lr=1.1073e-04) (hash(x)=44402342) +2147 train 3.156915 (lr=1.1045e-04) (hash(x)=39871491) +2148 train 3.181363 (lr=1.1018e-04) (hash(x)=35796868) +2149 train 3.216437 (lr=1.0990e-04) (hash(x)=43579902) +2150 val loss 3.1772 +2150 val perplexity 23.9804 +2150 train 3.153757 (lr=1.0963e-04) (hash(x)=33972047) +2151 train 3.164675 (lr=1.0935e-04) (hash(x)=36281612) +2152 train 3.161997 (lr=1.0908e-04) (hash(x)=36625143) +2153 train 3.191922 (lr=1.0881e-04) (hash(x)=41175869) +2154 train 3.196617 (lr=1.0853e-04) (hash(x)=38570240) +2155 train 3.159378 (lr=1.0826e-04) (hash(x)=37403603) +2156 train 3.176820 (lr=1.0799e-04) (hash(x)=37220490) +2157 train 3.199013 (lr=1.0772e-04) (hash(x)=39249867) +2158 train 3.207851 (lr=1.0745e-04) (hash(x)=35733583) +2159 train 3.196948 (lr=1.0718e-04) (hash(x)=40360042) +2160 train 3.183661 (lr=1.0692e-04) (hash(x)=48146101) +2161 train 3.204528 (lr=1.0665e-04) (hash(x)=37060502) +2162 train 3.176831 (lr=1.0638e-04) (hash(x)=40326752) +2163 train 3.236493 (lr=1.0612e-04) (hash(x)=40432915) +2164 train 3.248329 (lr=1.0585e-04) (hash(x)=45567935) +2165 train 3.186474 (lr=1.0559e-04) (hash(x)=43529661) +2166 train 3.194041 (lr=1.0532e-04) (hash(x)=41723553) +2167 train 3.217759 (lr=1.0506e-04) (hash(x)=42303062) +2168 train 3.310438 (lr=1.0480e-04) (hash(x)=36688744) +2169 train 3.184469 (lr=1.0453e-04) (hash(x)=37546228) +2170 train 3.249474 (lr=1.0427e-04) (hash(x)=46168084) +2171 train 3.191573 (lr=1.0401e-04) (hash(x)=46511793) +2172 train 3.227280 (lr=1.0375e-04) (hash(x)=39704989) +2173 train 3.219881 (lr=1.0349e-04) (hash(x)=38508459) +2174 train 3.280161 (lr=1.0324e-04) (hash(x)=38100692) +2175 val loss 3.1746 +2175 val perplexity 23.9179 +2175 train 3.241443 (lr=1.0298e-04) (hash(x)=49382598) +2176 train 3.225566 (lr=1.0272e-04) (hash(x)=38778831) +2177 train 3.242883 (lr=1.0247e-04) (hash(x)=41208421) +2178 train 3.164306 (lr=1.0221e-04) (hash(x)=40600596) +2179 train 3.166261 (lr=1.0196e-04) (hash(x)=44756487) +2180 train 3.190430 (lr=1.0170e-04) (hash(x)=36498264) +2181 train 3.225512 (lr=1.0145e-04) (hash(x)=40128717) +2182 train 3.246063 (lr=1.0120e-04) (hash(x)=39867883) +2183 train 3.215605 (lr=1.0094e-04) (hash(x)=34602753) +2184 train 3.183640 (lr=1.0069e-04) (hash(x)=37263336) +2185 train 3.186970 (lr=1.0044e-04) (hash(x)=39181931) +2186 train 3.215996 (lr=1.0019e-04) (hash(x)=39180468) +2187 train 3.146749 (lr=9.9942e-05) (hash(x)=45676342) +2188 train 3.269212 (lr=9.9694e-05) (hash(x)=34186435) +2189 train 3.231520 (lr=9.9446e-05) (hash(x)=40362722) +2190 train 3.337600 (lr=9.9199e-05) (hash(x)=37659552) +2191 train 3.223573 (lr=9.8953e-05) (hash(x)=40864867) +2192 train 3.111867 (lr=9.8708e-05) (hash(x)=39094131) +2193 train 3.195261 (lr=9.8463e-05) (hash(x)=39317988) +2194 train 3.160705 (lr=9.8219e-05) (hash(x)=42925963) +2195 train 3.185447 (lr=9.7975e-05) (hash(x)=37527819) +2196 train 3.148914 (lr=9.7733e-05) (hash(x)=39831257) +2197 train 3.194801 (lr=9.7491e-05) (hash(x)=39456492) +2198 train 3.232344 (lr=9.7250e-05) (hash(x)=35736738) +2199 train 3.221091 (lr=9.7009e-05) (hash(x)=37314296) +2200 val loss 3.1743 +2200 val perplexity 23.9096 +2200 train 3.151190 (lr=9.6769e-05) (hash(x)=40439855) +2201 train 3.206026 (lr=9.6530e-05) (hash(x)=38537192) +2202 train 3.231071 (lr=9.6292e-05) (hash(x)=42545932) +2203 train 3.275881 (lr=9.6054e-05) (hash(x)=42358547) +2204 train 3.211563 (lr=9.5818e-05) (hash(x)=45321664) +2205 train 3.212021 (lr=9.5581e-05) (hash(x)=41990758) +2206 train 3.180505 (lr=9.5346e-05) (hash(x)=40871414) +2207 train 3.189975 (lr=9.5111e-05) (hash(x)=46253678) +2208 train 3.240729 (lr=9.4877e-05) (hash(x)=38117956) +2209 train 3.207275 (lr=9.4644e-05) (hash(x)=43775849) +2210 train 3.189369 (lr=9.4412e-05) (hash(x)=35989715) +2211 train 3.328573 (lr=9.4180e-05) (hash(x)=37319331) +2212 train 3.204878 (lr=9.3949e-05) (hash(x)=37558417) +2213 train 3.189070 (lr=9.3718e-05) (hash(x)=39062591) +2214 train 3.213707 (lr=9.3489e-05) (hash(x)=27244469) +2215 train 3.234775 (lr=9.3260e-05) (hash(x)=32936708) +2216 train 3.268548 (lr=9.3032e-05) (hash(x)=41110814) +2217 train 3.191166 (lr=9.2804e-05) (hash(x)=41931538) +2218 train 3.196417 (lr=9.2578e-05) (hash(x)=38765773) +2219 train 3.233568 (lr=9.2352e-05) (hash(x)=38841881) +2220 train 3.197446 (lr=9.2127e-05) (hash(x)=28584663) +2221 train 3.155994 (lr=9.1902e-05) (hash(x)=39533986) +2222 train 3.229795 (lr=9.1679e-05) (hash(x)=41569214) +2223 train 3.188248 (lr=9.1456e-05) (hash(x)=39007918) +2224 train 3.204623 (lr=9.1233e-05) (hash(x)=37411031) +2225 val loss 3.1715 +2225 val perplexity 23.8429 +2225 train 3.168435 (lr=9.1012e-05) (hash(x)=42000080) +2226 train 3.155571 (lr=9.0791e-05) (hash(x)=35328387) +2227 train 3.170044 (lr=9.0571e-05) (hash(x)=41340268) +2228 train 3.123554 (lr=9.0352e-05) (hash(x)=41934876) +2229 train 3.195941 (lr=9.0133e-05) (hash(x)=40151703) +2230 train 3.207673 (lr=8.9916e-05) (hash(x)=40311177) +2231 train 3.199227 (lr=8.9698e-05) (hash(x)=37154884) +2232 train 3.175836 (lr=8.9482e-05) (hash(x)=41653379) +2233 train 3.195689 (lr=8.9267e-05) (hash(x)=40207795) +2234 train 3.195185 (lr=8.9052e-05) (hash(x)=37893389) +2235 train 3.226979 (lr=8.8838e-05) (hash(x)=40317089) +2236 train 3.154136 (lr=8.8624e-05) (hash(x)=37899012) +2237 train 3.161141 (lr=8.8412e-05) (hash(x)=40049932) +2238 train 3.228069 (lr=8.8200e-05) (hash(x)=41152327) +2239 train 3.252168 (lr=8.7989e-05) (hash(x)=37556713) +2240 train 3.288457 (lr=8.7779e-05) (hash(x)=35782016) +2241 train 3.206999 (lr=8.7569e-05) (hash(x)=35140985) +2242 train 3.152836 (lr=8.7360e-05) (hash(x)=38014868) +2243 train 3.172194 (lr=8.7152e-05) (hash(x)=45601217) +2244 train 3.251462 (lr=8.6945e-05) (hash(x)=35283633) +2245 train 3.198990 (lr=8.6738e-05) (hash(x)=39121820) +2246 train 3.178666 (lr=8.6533e-05) (hash(x)=33341688) +2247 train 3.219136 (lr=8.6328e-05) (hash(x)=39687800) +2248 train 3.280279 (lr=8.6123e-05) (hash(x)=38123993) +2249 train 3.189261 (lr=8.5920e-05) (hash(x)=46921668) +2250 val loss 3.1698 +2250 val perplexity 23.8021 +2250 hella 0.2873 +2250 train 3.192695 (lr=8.5717e-05) (hash(x)=43627909) +2251 train 3.152376 (lr=8.5515e-05) (hash(x)=37663843) +2252 train 3.178159 (lr=8.5314e-05) (hash(x)=34836689) +2253 train 3.217944 (lr=8.5113e-05) (hash(x)=39927186) +2254 train 3.200094 (lr=8.4913e-05) (hash(x)=39593004) +2255 train 3.207508 (lr=8.4714e-05) (hash(x)=45673735) +2256 train 3.213320 (lr=8.4516e-05) (hash(x)=41104010) +2257 train 3.208475 (lr=8.4319e-05) (hash(x)=41050014) +2258 train 3.207616 (lr=8.4122e-05) (hash(x)=33270846) +2259 train 3.203358 (lr=8.3926e-05) (hash(x)=34687139) +2260 train 3.195184 (lr=8.3731e-05) (hash(x)=43537200) +2261 train 3.217925 (lr=8.3536e-05) (hash(x)=41531635) +2262 train 3.186250 (lr=8.3343e-05) (hash(x)=37082323) +2263 train 3.228310 (lr=8.3150e-05) (hash(x)=43382076) +2264 train 3.223874 (lr=8.2958e-05) (hash(x)=41047002) +2265 train 3.161670 (lr=8.2766e-05) (hash(x)=39192350) +2266 train 3.249376 (lr=8.2576e-05) (hash(x)=37691702) +2267 train 3.305618 (lr=8.2386e-05) (hash(x)=39906405) +2268 train 3.181733 (lr=8.2197e-05) (hash(x)=37306842) +2269 train 3.233741 (lr=8.2009e-05) (hash(x)=38106536) +2270 train 3.222421 (lr=8.1821e-05) (hash(x)=38032415) +2271 train 3.168190 (lr=8.1634e-05) (hash(x)=36750690) +2272 train 3.187704 (lr=8.1448e-05) (hash(x)=38558396) +2273 train 3.233734 (lr=8.1263e-05) (hash(x)=37676712) +2274 train 3.189555 (lr=8.1079e-05) (hash(x)=39793457) +2275 val loss 3.1696 +2275 val perplexity 23.7982 +2275 train 3.137665 (lr=8.0895e-05) (hash(x)=38868040) +2276 train 3.148821 (lr=8.0712e-05) (hash(x)=36904609) +2277 train 3.124657 (lr=8.0530e-05) (hash(x)=46906076) +2278 train 3.097897 (lr=8.0348e-05) (hash(x)=52864307) +2279 train 3.127996 (lr=8.0168e-05) (hash(x)=38792493) +2280 train 3.113494 (lr=7.9988e-05) (hash(x)=43869467) +2281 train 3.138358 (lr=7.9809e-05) (hash(x)=40380951) +2282 train 3.238327 (lr=7.9631e-05) (hash(x)=44366521) +2283 train 3.140528 (lr=7.9453e-05) (hash(x)=42342179) +2284 train 3.270218 (lr=7.9276e-05) (hash(x)=41738513) +2285 train 3.167413 (lr=7.9101e-05) (hash(x)=40407555) +2286 train 3.094296 (lr=7.8925e-05) (hash(x)=40789316) +2287 train 3.209049 (lr=7.8751e-05) (hash(x)=38913391) +2288 train 3.150516 (lr=7.8577e-05) (hash(x)=47036772) +2289 train 3.195809 (lr=7.8405e-05) (hash(x)=26354961) +2290 train 3.209304 (lr=7.8232e-05) (hash(x)=40784104) +2291 train 3.203858 (lr=7.8061e-05) (hash(x)=43435512) +2292 train 3.237984 (lr=7.7891e-05) (hash(x)=42553720) +2293 train 3.192333 (lr=7.7721e-05) (hash(x)=37984547) +2294 train 3.219926 (lr=7.7552e-05) (hash(x)=42927726) +2295 train 3.234611 (lr=7.7384e-05) (hash(x)=42175938) +2296 train 3.185009 (lr=7.7217e-05) (hash(x)=41660050) +2297 train 3.165952 (lr=7.7050e-05) (hash(x)=40258171) +2298 train 3.196211 (lr=7.6884e-05) (hash(x)=38329934) +2299 train 3.225919 (lr=7.6719e-05) (hash(x)=32156995) +2300 val loss 3.1684 +2300 val perplexity 23.7692 +2300 train 3.116920 (lr=7.6555e-05) (hash(x)=48507790) +2301 train 3.166348 (lr=7.6392e-05) (hash(x)=37695808) +2302 train 3.177983 (lr=7.6229e-05) (hash(x)=38611601) +2303 train 3.150621 (lr=7.6067e-05) (hash(x)=40437689) +2304 train 3.197284 (lr=7.5906e-05) (hash(x)=43384874) +2305 train 3.171366 (lr=7.5746e-05) (hash(x)=38421638) +2306 train 3.150937 (lr=7.5586e-05) (hash(x)=41890318) +2307 train 3.210037 (lr=7.5427e-05) (hash(x)=44892372) +2308 train 3.157723 (lr=7.5269e-05) (hash(x)=33604327) +2309 train 3.273235 (lr=7.5112e-05) (hash(x)=45069907) +2310 train 3.196662 (lr=7.4956e-05) (hash(x)=38583278) +2311 train 3.209044 (lr=7.4800e-05) (hash(x)=36663739) +2312 train 3.153679 (lr=7.4646e-05) (hash(x)=40644905) +2313 train 3.161768 (lr=7.4492e-05) (hash(x)=36353540) +2314 train 3.219148 (lr=7.4338e-05) (hash(x)=33446948) +2315 train 3.177769 (lr=7.4186e-05) (hash(x)=41412846) +2316 train 3.199986 (lr=7.4034e-05) (hash(x)=41861581) +2317 train 3.101651 (lr=7.3884e-05) (hash(x)=39777306) +2318 train 3.157269 (lr=7.3734e-05) (hash(x)=39035874) +2319 train 3.148629 (lr=7.3584e-05) (hash(x)=37351804) +2320 train 3.147712 (lr=7.3436e-05) (hash(x)=41087228) +2321 train 3.125938 (lr=7.3288e-05) (hash(x)=40832561) +2322 train 3.189282 (lr=7.3141e-05) (hash(x)=38778936) +2323 train 3.186615 (lr=7.2995e-05) (hash(x)=41597361) +2324 train 3.234245 (lr=7.2850e-05) (hash(x)=37884561) +2325 val loss 3.1645 +2325 val perplexity 23.6762 +2325 train 3.127610 (lr=7.2706e-05) (hash(x)=41581772) +2326 train 3.212462 (lr=7.2562e-05) (hash(x)=40877354) +2327 train 3.202553 (lr=7.2419e-05) (hash(x)=41625142) +2328 train 3.188098 (lr=7.2277e-05) (hash(x)=39349602) +2329 train 3.169904 (lr=7.2136e-05) (hash(x)=41073420) +2330 train 3.185216 (lr=7.1995e-05) (hash(x)=40927210) +2331 train 3.195322 (lr=7.1856e-05) (hash(x)=41889457) +2332 train 3.214297 (lr=7.1717e-05) (hash(x)=36863749) +2333 train 3.201446 (lr=7.1579e-05) (hash(x)=41790403) +2334 train 3.222209 (lr=7.1441e-05) (hash(x)=38013384) +2335 train 3.211924 (lr=7.1305e-05) (hash(x)=41136927) +2336 train 3.229180 (lr=7.1169e-05) (hash(x)=36118984) +2337 train 3.149779 (lr=7.1034e-05) (hash(x)=35032908) +2338 train 3.245169 (lr=7.0900e-05) (hash(x)=39253140) +2339 train 3.184708 (lr=7.0767e-05) (hash(x)=30278988) +2340 train 3.168014 (lr=7.0635e-05) (hash(x)=38669699) +2341 train 3.178735 (lr=7.0503e-05) (hash(x)=33847912) +2342 train 3.370126 (lr=7.0372e-05) (hash(x)=37781837) +2343 train 3.202217 (lr=7.0242e-05) (hash(x)=39033484) +2344 train 3.212671 (lr=7.0113e-05) (hash(x)=40473140) +2345 train 3.166245 (lr=6.9984e-05) (hash(x)=38499643) +2346 train 3.142761 (lr=6.9857e-05) (hash(x)=42346456) +2347 train 3.171115 (lr=6.9730e-05) (hash(x)=38700794) +2348 train 3.147779 (lr=6.9604e-05) (hash(x)=37614713) +2349 train 3.143156 (lr=6.9479e-05) (hash(x)=42548828) +2350 val loss 3.1652 +2350 val perplexity 23.6924 +2350 train 3.176768 (lr=6.9354e-05) (hash(x)=34904275) +2351 train 3.203927 (lr=6.9231e-05) (hash(x)=45058829) +2352 train 3.186168 (lr=6.9108e-05) (hash(x)=36289706) +2353 train 3.159200 (lr=6.8986e-05) (hash(x)=39255517) +2354 train 3.201078 (lr=6.8865e-05) (hash(x)=40017470) +2355 train 3.124195 (lr=6.8744e-05) (hash(x)=39883882) +2356 train 3.181032 (lr=6.8625e-05) (hash(x)=47098079) +2357 train 3.155217 (lr=6.8506e-05) (hash(x)=44785563) +2358 train 3.211712 (lr=6.8388e-05) (hash(x)=41630703) +2359 train 3.158242 (lr=6.8271e-05) (hash(x)=42265263) +2360 train 3.181457 (lr=6.8155e-05) (hash(x)=42423511) +2361 train 3.174617 (lr=6.8039e-05) (hash(x)=44714452) +2362 train 3.230580 (lr=6.7925e-05) (hash(x)=49394032) +2363 train 3.194075 (lr=6.7811e-05) (hash(x)=41446183) +2364 train 3.189980 (lr=6.7698e-05) (hash(x)=45423241) +2365 train 3.218899 (lr=6.7585e-05) (hash(x)=38575184) +2366 train 3.157509 (lr=6.7474e-05) (hash(x)=40011652) +2367 train 3.158178 (lr=6.7363e-05) (hash(x)=36502424) +2368 train 3.196077 (lr=6.7254e-05) (hash(x)=37277966) +2369 train 3.163372 (lr=6.7145e-05) (hash(x)=42050131) +2370 train 3.172558 (lr=6.7036e-05) (hash(x)=40488046) +2371 train 3.150167 (lr=6.6929e-05) (hash(x)=41628228) +2372 train 3.196053 (lr=6.6822e-05) (hash(x)=38976337) +2373 train 3.190768 (lr=6.6717e-05) (hash(x)=42548965) +2374 train 3.225233 (lr=6.6612e-05) (hash(x)=42149363) +2375 val loss 3.1632 +2375 val perplexity 23.6462 +2375 train 3.257929 (lr=6.6508e-05) (hash(x)=36093892) +2376 train 3.212163 (lr=6.6404e-05) (hash(x)=38487793) +2377 train 3.158589 (lr=6.6302e-05) (hash(x)=35406173) +2378 train 3.144438 (lr=6.6200e-05) (hash(x)=42860597) +2379 train 3.180876 (lr=6.6099e-05) (hash(x)=40471517) +2380 train 3.252946 (lr=6.5999e-05) (hash(x)=38208956) +2381 train 3.217980 (lr=6.5900e-05) (hash(x)=37287570) +2382 train 3.173961 (lr=6.5802e-05) (hash(x)=38513031) +2383 train 3.179870 (lr=6.5704e-05) (hash(x)=42048953) +2384 train 3.194555 (lr=6.5607e-05) (hash(x)=37180778) +2385 train 3.127796 (lr=6.5511e-05) (hash(x)=36795978) +2386 train 3.144840 (lr=6.5416e-05) (hash(x)=34755135) +2387 train 3.140290 (lr=6.5322e-05) (hash(x)=36720056) +2388 train 3.165158 (lr=6.5229e-05) (hash(x)=35001697) +2389 train 3.156161 (lr=6.5136e-05) (hash(x)=44216024) +2390 train 3.190417 (lr=6.5044e-05) (hash(x)=35606719) +2391 train 3.172535 (lr=6.4953e-05) (hash(x)=38626374) +2392 train 3.096777 (lr=6.4863e-05) (hash(x)=43128356) +2393 train 3.192488 (lr=6.4774e-05) (hash(x)=33631790) +2394 train 3.188267 (lr=6.4685e-05) (hash(x)=37013026) +2395 train 3.179092 (lr=6.4597e-05) (hash(x)=38279807) +2396 train 3.175366 (lr=6.4510e-05) (hash(x)=54250224) +2397 train 3.218047 (lr=6.4424e-05) (hash(x)=37829360) +2398 train 3.246032 (lr=6.4339e-05) (hash(x)=34562819) +2399 train 3.156776 (lr=6.4255e-05) (hash(x)=38588555) +2400 val loss 3.1618 +2400 val perplexity 23.6140 +2400 train 3.191436 (lr=6.4171e-05) (hash(x)=41714010) +2401 train 3.147417 (lr=6.4088e-05) (hash(x)=40847756) +2402 train 3.205053 (lr=6.4006e-05) (hash(x)=42082508) +2403 train 3.154894 (lr=6.3925e-05) (hash(x)=39275125) +2404 train 3.233796 (lr=6.3845e-05) (hash(x)=48358855) +2405 train 3.175199 (lr=6.3765e-05) (hash(x)=40583533) +2406 train 3.171179 (lr=6.3687e-05) (hash(x)=39011594) +2407 train 3.117702 (lr=6.3609e-05) (hash(x)=36824577) +2408 train 3.174238 (lr=6.3532e-05) (hash(x)=34469865) +2409 train 3.185596 (lr=6.3456e-05) (hash(x)=44032280) +2410 train 3.180871 (lr=6.3380e-05) (hash(x)=41368977) +2411 train 3.200687 (lr=6.3306e-05) (hash(x)=38937806) +2412 train 3.188562 (lr=6.3232e-05) (hash(x)=39628376) +2413 train 3.194297 (lr=6.3159e-05) (hash(x)=34947735) +2414 train 3.169108 (lr=6.3087e-05) (hash(x)=39550281) +2415 train 3.201134 (lr=6.3016e-05) (hash(x)=44916647) +2416 train 3.155251 (lr=6.2945e-05) (hash(x)=36634407) +2417 train 3.183017 (lr=6.2876e-05) (hash(x)=40602462) +2418 train 3.171113 (lr=6.2807e-05) (hash(x)=44797558) +2419 train 3.174513 (lr=6.2739e-05) (hash(x)=32683756) +2420 train 3.157426 (lr=6.2672e-05) (hash(x)=40222481) +2421 train 3.164004 (lr=6.2606e-05) (hash(x)=41158201) +2422 train 3.149777 (lr=6.2540e-05) (hash(x)=38804495) +2423 train 3.184538 (lr=6.2476e-05) (hash(x)=39487565) +2424 train 3.172535 (lr=6.2412e-05) (hash(x)=39824017) +2425 val loss 3.1618 +2425 val perplexity 23.6119 +2425 train 3.096504 (lr=6.2349e-05) (hash(x)=37587696) +2426 train 3.196667 (lr=6.2287e-05) (hash(x)=39632774) +2427 train 3.197175 (lr=6.2225e-05) (hash(x)=45941633) +2428 train 3.103321 (lr=6.2165e-05) (hash(x)=42335966) +2429 train 3.185068 (lr=6.2105e-05) (hash(x)=47609367) +2430 train 3.218474 (lr=6.2046e-05) (hash(x)=39450223) +2431 train 3.163240 (lr=6.1988e-05) (hash(x)=40414253) +2432 train 3.195980 (lr=6.1931e-05) (hash(x)=38849710) +2433 train 3.191642 (lr=6.1875e-05) (hash(x)=41653220) +2434 train 3.166094 (lr=6.1820e-05) (hash(x)=40169526) +2435 train 3.196271 (lr=6.1765e-05) (hash(x)=44858000) +2436 train 3.177360 (lr=6.1711e-05) (hash(x)=38894878) +2437 train 3.183860 (lr=6.1658e-05) (hash(x)=43613758) +2438 train 3.232023 (lr=6.1606e-05) (hash(x)=47474569) +2439 train 3.150385 (lr=6.1555e-05) (hash(x)=43775495) +2440 train 3.364250 (lr=6.1504e-05) (hash(x)=40715325) +2441 train 3.181325 (lr=6.1454e-05) (hash(x)=39592467) +2442 train 3.178249 (lr=6.1406e-05) (hash(x)=42624187) +2443 train 3.267856 (lr=6.1358e-05) (hash(x)=50975897) +2444 train 3.101630 (lr=6.1310e-05) (hash(x)=37829145) +2445 train 3.259470 (lr=6.1264e-05) (hash(x)=36552249) +2446 train 3.198108 (lr=6.1218e-05) (hash(x)=44288049) +2447 train 3.235226 (lr=6.1174e-05) (hash(x)=37746209) +2448 train 3.234485 (lr=6.1130e-05) (hash(x)=40652438) +2449 train 3.212986 (lr=6.1087e-05) (hash(x)=44620132) +2450 val loss 3.1606 +2450 val perplexity 23.5857 +2450 train 3.204928 (lr=6.1045e-05) (hash(x)=45561207) +2451 train 3.194884 (lr=6.1003e-05) (hash(x)=39004659) +2452 train 3.174356 (lr=6.0963e-05) (hash(x)=35113270) +2453 train 3.168595 (lr=6.0923e-05) (hash(x)=36351666) +2454 train 3.172582 (lr=6.0884e-05) (hash(x)=38936350) +2455 train 3.216583 (lr=6.0846e-05) (hash(x)=46201334) +2456 train 3.086204 (lr=6.0809e-05) (hash(x)=43453200) +2457 train 3.105927 (lr=6.0773e-05) (hash(x)=37184899) +2458 train 3.205726 (lr=6.0737e-05) (hash(x)=40527967) +2459 train 3.207264 (lr=6.0703e-05) (hash(x)=39602329) +2460 train 3.154262 (lr=6.0669e-05) (hash(x)=38847498) +2461 train 3.130014 (lr=6.0636e-05) (hash(x)=44106590) +2462 train 3.155589 (lr=6.0604e-05) (hash(x)=41490965) +2463 train 3.162129 (lr=6.0572e-05) (hash(x)=39832265) +2464 train 3.194639 (lr=6.0542e-05) (hash(x)=41997044) +2465 train 3.170419 (lr=6.0512e-05) (hash(x)=40129952) +2466 train 3.224929 (lr=6.0483e-05) (hash(x)=39801305) +2467 train 3.158404 (lr=6.0455e-05) (hash(x)=38914190) +2468 train 3.256289 (lr=6.0428e-05) (hash(x)=37138572) +2469 train 3.209816 (lr=6.0402e-05) (hash(x)=41294566) +2470 train 3.161743 (lr=6.0376e-05) (hash(x)=44762367) +2471 train 3.150369 (lr=6.0352e-05) (hash(x)=41635683) +2472 train 3.198856 (lr=6.0328e-05) (hash(x)=37761743) +2473 train 3.177891 (lr=6.0305e-05) (hash(x)=45386286) +2474 train 3.227271 (lr=6.0283e-05) (hash(x)=42485480) +2475 val loss 3.1586 +2475 val perplexity 23.5377 +2475 train 3.163866 (lr=6.0261e-05) (hash(x)=40198349) +2476 train 3.115510 (lr=6.0241e-05) (hash(x)=43807060) +2477 train 3.152856 (lr=6.0221e-05) (hash(x)=39885607) +2478 train 3.192984 (lr=6.0202e-05) (hash(x)=43005593) +2479 train 3.211437 (lr=6.0184e-05) (hash(x)=35687855) +2480 train 3.171411 (lr=6.0167e-05) (hash(x)=36913433) +2481 train 3.253450 (lr=6.0151e-05) (hash(x)=41135209) +2482 train 3.231420 (lr=6.0135e-05) (hash(x)=50145156) +2483 train 3.248109 (lr=6.0121e-05) (hash(x)=38878355) +2484 train 3.231893 (lr=6.0107e-05) (hash(x)=40197635) +2485 train 3.296749 (lr=6.0094e-05) (hash(x)=44139663) +2486 train 3.177407 (lr=6.0082e-05) (hash(x)=38855758) +2487 train 3.213601 (lr=6.0071e-05) (hash(x)=42214173) +2488 train 3.223625 (lr=6.0060e-05) (hash(x)=31913186) +2489 train 3.238159 (lr=6.0051e-05) (hash(x)=38815597) +2490 train 3.189882 (lr=6.0042e-05) (hash(x)=37557401) +2491 train 3.164188 (lr=6.0034e-05) (hash(x)=41046165) +2492 train 3.180332 (lr=6.0027e-05) (hash(x)=43449463) +2493 train 3.162686 (lr=6.0020e-05) (hash(x)=38023800) +2494 train 3.179134 (lr=6.0015e-05) (hash(x)=41871892) +2495 train 3.160711 (lr=6.0010e-05) (hash(x)=40567150) +2496 train 3.105864 (lr=6.0007e-05) (hash(x)=44577568) +2497 train 3.176164 (lr=6.0004e-05) (hash(x)=40080828) +2498 train 3.179257 (lr=6.0002e-05) (hash(x)=39340600) +2499 val loss 3.1599 +2499 val perplexity 23.5678 +2499 hella 0.2868 +2499 train 3.161965 (lr=6.0000e-05) (hash(x)=43843813)