diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/args.json b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/args.json new file mode 100644 index 0000000000000000000000000000000000000000..302f5a54eebc0bf19ad8eff57e2ecfcf3fa26c93 --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/args.json @@ -0,0 +1 @@ +{"hellaswag": true, "attention_kind": "selective", "log_dir": "proxy_model_sweep_2/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 10000, "warmup_steps": 1, "group": "proxy_model_sweep_2", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1337, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 20, "total_batch_size": 5120, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr": 0.000175, "decay_lr": true, "readout_zero_init": false, "query_zero_init": false, "l1_loss": false, "debugpy": false, "n_embd": 128} \ No newline at end of file diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/dataloader_02500.pt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/dataloader_02500.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bc253f8fc6225637fb651d7b45bcde02b1c9ff0 --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/dataloader_02500.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5f86eba64e08aa3145708d463ef689ecaee47ebe0a97035e6e0aeb59f377344 +size 964 diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/dataloader_05000.pt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/dataloader_05000.pt new file mode 100644 index 0000000000000000000000000000000000000000..bece7d05d8848580e904f556cba45a27c2aabefc --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/dataloader_05000.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a669cff46eb6a9ac053ccb64aba9cabfe25f09b9de8be0fa7cbcf53d547468bd +size 964 diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/dataloader_07500.pt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/dataloader_07500.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c0ee8c168397a0e7b7775123a24de07bc00a1af --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/dataloader_07500.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5ccc252bab74018a361c32a7ec3feffb7cfbeb3a9386972640ad89c08895266 +size 964 diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/dataloader_09999.pt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/dataloader_09999.pt new file mode 100644 index 0000000000000000000000000000000000000000..b55d9a6dac70f629d30f6dbbcdedb32b282b909b --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/dataloader_09999.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b95c984402cc9cb954a35bd3e3a1d7e71c550bc1628b6c4dca17aedfa872fb2 +size 964 diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/log2.txt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/log2.txt new file mode 100644 index 0000000000000000000000000000000000000000..973f4d729bab23e216a99a6eb739b70f2fe5183c --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/log2.txt @@ -0,0 +1,10403 @@ +max_steps: 10000 +0 val loss 11.7537 +0 val perplexity 127229.2734 +0 train 11.717543 (lr=1.7500e-04) (hash(x)=22886834) +1 train 11.387790 (lr=1.7500e-04) (hash(x)=26375038) +2 train 11.072809 (lr=1.7500e-04) (hash(x)=30598777) +3 train 10.848566 (lr=1.7500e-04) (hash(x)=27234506) +4 train 10.487396 (lr=1.7500e-04) (hash(x)=27767880) +5 train 10.320102 (lr=1.7500e-04) (hash(x)=23702020) +6 train 10.219807 (lr=1.7500e-04) (hash(x)=31986844) +7 train 10.217485 (lr=1.7500e-04) (hash(x)=20782690) +8 train 10.168891 (lr=1.7500e-04) (hash(x)=25201599) +9 train 10.080634 (lr=1.7500e-04) (hash(x)=23094976) +10 train 10.078605 (lr=1.7500e-04) (hash(x)=23841096) +11 train 10.033015 (lr=1.7500e-04) (hash(x)=26532095) +12 train 9.995017 (lr=1.7500e-04) (hash(x)=24432298) +13 train 9.889338 (lr=1.7500e-04) (hash(x)=27151649) +14 train 9.780807 (lr=1.7500e-04) (hash(x)=24596846) +15 train 9.737216 (lr=1.7500e-04) (hash(x)=23890908) +16 train 9.627806 (lr=1.7500e-04) (hash(x)=28913955) +17 train 9.530715 (lr=1.7500e-04) (hash(x)=25588236) +18 train 9.557948 (lr=1.7500e-04) (hash(x)=23770034) +19 train 9.441186 (lr=1.7500e-04) (hash(x)=24011372) +20 train 9.296049 (lr=1.7500e-04) (hash(x)=25441898) +21 train 9.431739 (lr=1.7500e-04) (hash(x)=28375581) +22 train 9.180840 (lr=1.7500e-04) (hash(x)=24046679) +23 train 9.209860 (lr=1.7500e-04) (hash(x)=24611628) +24 train 9.232833 (lr=1.7500e-04) (hash(x)=26169030) +25 train 9.194285 (lr=1.7500e-04) (hash(x)=30298407) +26 train 8.992119 (lr=1.7500e-04) (hash(x)=23711112) +27 train 8.763118 (lr=1.7500e-04) (hash(x)=19245352) +28 train 8.784709 (lr=1.7500e-04) (hash(x)=21529136) +29 train 9.023089 (lr=1.7500e-04) (hash(x)=28936608) +30 train 8.673490 (lr=1.7500e-04) (hash(x)=24339013) +31 train 8.577460 (lr=1.7500e-04) (hash(x)=25767553) +32 train 8.683044 (lr=1.7500e-04) (hash(x)=26439905) +33 train 8.780372 (lr=1.7500e-04) (hash(x)=31093473) +34 train 8.540997 (lr=1.7500e-04) (hash(x)=25450374) +35 train 8.401160 (lr=1.7500e-04) (hash(x)=24809873) +36 train 8.499735 (lr=1.7500e-04) (hash(x)=23253252) +37 train 8.592098 (lr=1.7499e-04) (hash(x)=27852919) +38 train 8.390683 (lr=1.7499e-04) (hash(x)=23327497) +39 train 8.182198 (lr=1.7499e-04) (hash(x)=22512166) +40 train 8.346059 (lr=1.7499e-04) (hash(x)=22859419) +41 train 8.290916 (lr=1.7499e-04) (hash(x)=27620338) +42 train 8.349892 (lr=1.7499e-04) (hash(x)=26397837) +43 train 8.376694 (lr=1.7499e-04) (hash(x)=28092148) +44 train 8.266028 (lr=1.7499e-04) (hash(x)=24662703) +45 train 8.432530 (lr=1.7499e-04) (hash(x)=27938767) +46 train 8.636294 (lr=1.7499e-04) (hash(x)=26037988) +47 train 8.135444 (lr=1.7499e-04) (hash(x)=24732833) +48 train 8.228609 (lr=1.7499e-04) (hash(x)=25259526) +49 train 8.100403 (lr=1.7499e-04) (hash(x)=23200230) +50 val loss 8.1008 +50 val perplexity 3297.0654 +50 train 8.171128 (lr=1.7499e-04) (hash(x)=26721357) +51 train 7.924701 (lr=1.7499e-04) (hash(x)=22694718) +52 train 8.062140 (lr=1.7499e-04) (hash(x)=28066766) +53 train 8.014413 (lr=1.7499e-04) (hash(x)=23125151) +54 train 8.044814 (lr=1.7499e-04) (hash(x)=27193725) +55 train 7.920696 (lr=1.7499e-04) (hash(x)=25129410) +56 train 8.033238 (lr=1.7499e-04) (hash(x)=24263988) +57 train 7.824045 (lr=1.7499e-04) (hash(x)=23059154) +58 train 8.041553 (lr=1.7499e-04) (hash(x)=26063864) +59 train 8.260378 (lr=1.7499e-04) (hash(x)=27858570) +60 train 7.999161 (lr=1.7499e-04) (hash(x)=23874620) +61 train 7.837064 (lr=1.7499e-04) (hash(x)=22402617) +62 train 7.975332 (lr=1.7499e-04) (hash(x)=23600822) +63 train 7.829595 (lr=1.7499e-04) (hash(x)=26582391) +64 train 7.813296 (lr=1.7498e-04) (hash(x)=23225283) +65 train 8.152164 (lr=1.7498e-04) (hash(x)=26075451) +66 train 7.849660 (lr=1.7498e-04) (hash(x)=24723419) +67 train 8.038936 (lr=1.7498e-04) (hash(x)=27279806) +68 train 7.806892 (lr=1.7498e-04) (hash(x)=25870391) +69 train 8.016068 (lr=1.7498e-04) (hash(x)=26188136) +70 train 8.190073 (lr=1.7498e-04) (hash(x)=30373443) +71 train 8.072668 (lr=1.7498e-04) (hash(x)=26472336) +72 train 7.871035 (lr=1.7498e-04) (hash(x)=26651572) +73 train 7.985930 (lr=1.7498e-04) (hash(x)=26376212) +74 train 7.967943 (lr=1.7498e-04) (hash(x)=26733350) +75 train 8.118359 (lr=1.7498e-04) (hash(x)=28301589) +76 train 7.969753 (lr=1.7498e-04) (hash(x)=27599559) +77 train 7.996449 (lr=1.7498e-04) (hash(x)=28035221) +78 train 8.002274 (lr=1.7498e-04) (hash(x)=25016783) +79 train 8.027806 (lr=1.7498e-04) (hash(x)=27654289) +80 train 7.837456 (lr=1.7498e-04) (hash(x)=24597558) +81 train 7.670068 (lr=1.7498e-04) (hash(x)=21560904) +82 train 7.673793 (lr=1.7497e-04) (hash(x)=21983837) +83 train 7.869457 (lr=1.7497e-04) (hash(x)=24995715) +84 train 8.179688 (lr=1.7497e-04) (hash(x)=29876413) +85 train 7.823871 (lr=1.7497e-04) (hash(x)=23792508) +86 train 7.745181 (lr=1.7497e-04) (hash(x)=25509120) +87 train 7.964862 (lr=1.7497e-04) (hash(x)=26559876) +88 train 7.892053 (lr=1.7497e-04) (hash(x)=23569647) +89 train 7.905339 (lr=1.7497e-04) (hash(x)=25758852) +90 train 7.767405 (lr=1.7497e-04) (hash(x)=25706298) +91 train 7.910306 (lr=1.7497e-04) (hash(x)=28364895) +92 train 7.677411 (lr=1.7497e-04) (hash(x)=25304663) +93 train 7.844238 (lr=1.7497e-04) (hash(x)=25269299) +94 train 7.969888 (lr=1.7497e-04) (hash(x)=25870566) +95 train 7.619409 (lr=1.7497e-04) (hash(x)=21770329) +96 train 8.008567 (lr=1.7496e-04) (hash(x)=27595900) +97 train 7.974862 (lr=1.7496e-04) (hash(x)=24785397) +98 train 7.721855 (lr=1.7496e-04) (hash(x)=21521480) +99 train 7.808492 (lr=1.7496e-04) (hash(x)=24628606) +100 val loss 7.8375 +100 val perplexity 2533.9084 +100 train 7.914215 (lr=1.7496e-04) (hash(x)=24670150) +101 train 7.795280 (lr=1.7496e-04) (hash(x)=23181910) +102 train 7.748592 (lr=1.7496e-04) (hash(x)=22714991) +103 train 7.709934 (lr=1.7496e-04) (hash(x)=22723459) +104 train 7.652877 (lr=1.7496e-04) (hash(x)=21524316) +105 train 7.841011 (lr=1.7496e-04) (hash(x)=25506632) +106 train 7.566896 (lr=1.7496e-04) (hash(x)=21675672) +107 train 7.680740 (lr=1.7496e-04) (hash(x)=22897919) +108 train 7.715202 (lr=1.7496e-04) (hash(x)=23321631) +109 train 7.897560 (lr=1.7495e-04) (hash(x)=26546719) +110 train 8.963068 (lr=1.7495e-04) (hash(x)=31962348) +111 train 8.194994 (lr=1.7495e-04) (hash(x)=30338342) +112 train 7.761909 (lr=1.7495e-04) (hash(x)=23724471) +113 train 7.945762 (lr=1.7495e-04) (hash(x)=29175888) +114 train 7.957448 (lr=1.7495e-04) (hash(x)=23256716) +115 train 8.038605 (lr=1.7495e-04) (hash(x)=27063280) +116 train 8.052036 (lr=1.7495e-04) (hash(x)=31057659) +117 train 8.185000 (lr=1.7495e-04) (hash(x)=32915097) +118 train 8.101087 (lr=1.7495e-04) (hash(x)=28842717) +119 train 7.786813 (lr=1.7495e-04) (hash(x)=25678059) +120 train 7.680457 (lr=1.7494e-04) (hash(x)=21593510) +121 train 7.599580 (lr=1.7494e-04) (hash(x)=20083773) +122 train 7.736897 (lr=1.7494e-04) (hash(x)=23002820) +123 train 7.541101 (lr=1.7494e-04) (hash(x)=21853028) +124 train 7.829818 (lr=1.7494e-04) (hash(x)=26985625) +125 train 7.558042 (lr=1.7494e-04) (hash(x)=21808483) +126 train 7.999930 (lr=1.7494e-04) (hash(x)=28873251) +127 train 7.815692 (lr=1.7494e-04) (hash(x)=26109335) +128 train 7.999889 (lr=1.7494e-04) (hash(x)=26334674) +129 train 7.873211 (lr=1.7494e-04) (hash(x)=24916754) +130 train 7.832350 (lr=1.7494e-04) (hash(x)=25449624) +131 train 7.912010 (lr=1.7493e-04) (hash(x)=25334848) +132 train 8.219378 (lr=1.7493e-04) (hash(x)=27484863) +133 train 7.740839 (lr=1.7493e-04) (hash(x)=24917705) +134 train 7.693491 (lr=1.7493e-04) (hash(x)=25143449) +135 train 7.712107 (lr=1.7493e-04) (hash(x)=25044885) +136 train 7.980123 (lr=1.7493e-04) (hash(x)=27821028) +137 train 7.931516 (lr=1.7493e-04) (hash(x)=28747022) +138 train 7.858842 (lr=1.7493e-04) (hash(x)=27182888) +139 train 7.689018 (lr=1.7493e-04) (hash(x)=23678349) +140 train 7.832613 (lr=1.7492e-04) (hash(x)=23593235) +141 train 8.132922 (lr=1.7492e-04) (hash(x)=28529813) +142 train 8.433945 (lr=1.7492e-04) (hash(x)=32074661) +143 train 8.022489 (lr=1.7492e-04) (hash(x)=28870690) +144 train 7.954082 (lr=1.7492e-04) (hash(x)=27307705) +145 train 7.798363 (lr=1.7492e-04) (hash(x)=25044834) +146 train 7.824174 (lr=1.7492e-04) (hash(x)=23712023) +147 train 8.349800 (lr=1.7492e-04) (hash(x)=32982615) +148 train 8.113904 (lr=1.7492e-04) (hash(x)=30113660) +149 train 7.549158 (lr=1.7491e-04) (hash(x)=20970960) +150 val loss 7.7955 +150 val perplexity 2429.7546 +150 train 7.760231 (lr=1.7491e-04) (hash(x)=23132684) +151 train 9.481065 (lr=1.7491e-04) (hash(x)=35279941) +152 train 8.691726 (lr=1.7491e-04) (hash(x)=31227444) +153 train 7.785446 (lr=1.7491e-04) (hash(x)=25529472) +154 train 7.859598 (lr=1.7491e-04) (hash(x)=24350409) +155 train 8.161690 (lr=1.7491e-04) (hash(x)=26400041) +156 train 7.823780 (lr=1.7491e-04) (hash(x)=25262621) +157 train 7.847019 (lr=1.7491e-04) (hash(x)=24656138) +158 train 8.034095 (lr=1.7490e-04) (hash(x)=26803414) +159 train 7.913691 (lr=1.7490e-04) (hash(x)=25015923) +160 train 7.647293 (lr=1.7490e-04) (hash(x)=23581172) +161 train 7.787302 (lr=1.7490e-04) (hash(x)=22924885) +162 train 7.682102 (lr=1.7490e-04) (hash(x)=23414296) +163 train 7.864666 (lr=1.7490e-04) (hash(x)=24853586) +164 train 7.917706 (lr=1.7490e-04) (hash(x)=25000130) +165 train 7.823215 (lr=1.7490e-04) (hash(x)=27004780) +166 train 7.864797 (lr=1.7489e-04) (hash(x)=26148573) +167 train 7.809293 (lr=1.7489e-04) (hash(x)=26740855) +168 train 7.485372 (lr=1.7489e-04) (hash(x)=20965419) +169 train 7.728194 (lr=1.7489e-04) (hash(x)=23950114) +170 train 7.650537 (lr=1.7489e-04) (hash(x)=24951982) +171 train 7.770790 (lr=1.7489e-04) (hash(x)=24584116) +172 train 7.758091 (lr=1.7489e-04) (hash(x)=24378759) +173 train 7.758475 (lr=1.7489e-04) (hash(x)=25718516) +174 train 7.881557 (lr=1.7488e-04) (hash(x)=28424396) +175 train 7.660587 (lr=1.7488e-04) (hash(x)=22262151) +176 train 7.917156 (lr=1.7488e-04) (hash(x)=26438412) +177 train 7.691567 (lr=1.7488e-04) (hash(x)=23025303) +178 train 7.764558 (lr=1.7488e-04) (hash(x)=24190770) +179 train 7.946657 (lr=1.7488e-04) (hash(x)=26627860) +180 train 7.714971 (lr=1.7488e-04) (hash(x)=23663439) +181 train 7.588162 (lr=1.7487e-04) (hash(x)=23700532) +182 train 7.591295 (lr=1.7487e-04) (hash(x)=23075676) +183 train 7.829134 (lr=1.7487e-04) (hash(x)=26621834) +184 train 7.892342 (lr=1.7487e-04) (hash(x)=29426269) +185 train 7.507324 (lr=1.7487e-04) (hash(x)=21821465) +186 train 7.799781 (lr=1.7487e-04) (hash(x)=26506130) +187 train 8.060587 (lr=1.7487e-04) (hash(x)=26930630) +188 train 7.557540 (lr=1.7486e-04) (hash(x)=22993793) +189 train 7.455083 (lr=1.7486e-04) (hash(x)=19557946) +190 train 7.768485 (lr=1.7486e-04) (hash(x)=23572891) +191 train 7.610698 (lr=1.7486e-04) (hash(x)=23234741) +192 train 7.695989 (lr=1.7486e-04) (hash(x)=25547951) +193 train 7.775999 (lr=1.7486e-04) (hash(x)=26713563) +194 train 7.791559 (lr=1.7486e-04) (hash(x)=25913622) +195 train 8.017021 (lr=1.7485e-04) (hash(x)=28102443) +196 train 7.704450 (lr=1.7485e-04) (hash(x)=23093351) +197 train 8.453059 (lr=1.7485e-04) (hash(x)=31689122) +198 train 8.299349 (lr=1.7485e-04) (hash(x)=32252517) +199 train 7.820924 (lr=1.7485e-04) (hash(x)=25470563) +200 val loss 7.7611 +200 val perplexity 2347.3752 +200 train 7.854872 (lr=1.7485e-04) (hash(x)=25597614) +201 train 7.910756 (lr=1.7484e-04) (hash(x)=23757479) +202 train 7.703302 (lr=1.7484e-04) (hash(x)=25140048) +203 train 7.907781 (lr=1.7484e-04) (hash(x)=28282861) +204 train 7.700969 (lr=1.7484e-04) (hash(x)=24754885) +205 train 7.925158 (lr=1.7484e-04) (hash(x)=26731964) +206 train 8.022298 (lr=1.7484e-04) (hash(x)=26660561) +207 train 7.586006 (lr=1.7484e-04) (hash(x)=21799102) +208 train 7.796894 (lr=1.7483e-04) (hash(x)=27025986) +209 train 7.619682 (lr=1.7483e-04) (hash(x)=24672077) +210 train 7.707273 (lr=1.7483e-04) (hash(x)=25322984) +211 train 7.556777 (lr=1.7483e-04) (hash(x)=23471769) +212 train 7.397170 (lr=1.7483e-04) (hash(x)=20766491) +213 train 7.907413 (lr=1.7483e-04) (hash(x)=24058931) +214 train 7.606233 (lr=1.7482e-04) (hash(x)=23872843) +215 train 7.649713 (lr=1.7482e-04) (hash(x)=23275479) +216 train 7.766348 (lr=1.7482e-04) (hash(x)=24914695) +217 train 7.645772 (lr=1.7482e-04) (hash(x)=24364396) +218 train 7.902153 (lr=1.7482e-04) (hash(x)=27986474) +219 train 7.807587 (lr=1.7482e-04) (hash(x)=24473581) +220 train 7.701970 (lr=1.7481e-04) (hash(x)=22974689) +221 train 7.803379 (lr=1.7481e-04) (hash(x)=23774644) +222 train 7.724121 (lr=1.7481e-04) (hash(x)=23245327) +223 train 7.515969 (lr=1.7481e-04) (hash(x)=22091862) +224 train 7.601925 (lr=1.7481e-04) (hash(x)=24362839) +225 train 7.750305 (lr=1.7481e-04) (hash(x)=25482303) +226 train 7.842496 (lr=1.7480e-04) (hash(x)=24911853) +227 train 7.805655 (lr=1.7480e-04) (hash(x)=26018202) +228 train 7.635735 (lr=1.7480e-04) (hash(x)=26124495) +229 train 7.790889 (lr=1.7480e-04) (hash(x)=24560096) +230 train 7.767109 (lr=1.7480e-04) (hash(x)=24695331) +231 train 7.512361 (lr=1.7479e-04) (hash(x)=17430373) +232 train 7.530595 (lr=1.7479e-04) (hash(x)=21813345) +233 train 7.148598 (lr=1.7479e-04) (hash(x)=20098681) +234 train 7.495050 (lr=1.7479e-04) (hash(x)=25095928) +235 train 7.622829 (lr=1.7479e-04) (hash(x)=24078083) +236 train 7.604046 (lr=1.7479e-04) (hash(x)=22901505) +237 train 7.795442 (lr=1.7478e-04) (hash(x)=26595592) +238 train 7.691138 (lr=1.7478e-04) (hash(x)=27663196) +239 train 7.502931 (lr=1.7478e-04) (hash(x)=22954861) +240 train 7.998073 (lr=1.7478e-04) (hash(x)=30159234) +241 train 7.867140 (lr=1.7478e-04) (hash(x)=29294271) +242 train 7.811857 (lr=1.7477e-04) (hash(x)=23728322) +243 train 7.851375 (lr=1.7477e-04) (hash(x)=28695016) +244 train 7.986904 (lr=1.7477e-04) (hash(x)=26702728) +245 train 7.780266 (lr=1.7477e-04) (hash(x)=27100115) +246 train 7.694339 (lr=1.7477e-04) (hash(x)=25082752) +247 train 8.028763 (lr=1.7476e-04) (hash(x)=26671799) +248 train 7.709586 (lr=1.7476e-04) (hash(x)=23718946) +249 train 7.932622 (lr=1.7476e-04) (hash(x)=28137394) +250 val loss 7.7296 +250 val perplexity 2274.7268 +250 train 7.992450 (lr=1.7476e-04) (hash(x)=23893495) +251 train 7.765212 (lr=1.7476e-04) (hash(x)=23166092) +252 train 7.743087 (lr=1.7476e-04) (hash(x)=25907665) +253 train 7.687177 (lr=1.7475e-04) (hash(x)=25885986) +254 train 7.742312 (lr=1.7475e-04) (hash(x)=25262712) +255 train 7.700317 (lr=1.7475e-04) (hash(x)=26924723) +256 train 7.888734 (lr=1.7475e-04) (hash(x)=28744736) +257 train 7.640926 (lr=1.7475e-04) (hash(x)=26140590) +258 train 7.880619 (lr=1.7474e-04) (hash(x)=25780449) +259 train 7.676221 (lr=1.7474e-04) (hash(x)=25138659) +260 train 7.982831 (lr=1.7474e-04) (hash(x)=27244046) +261 train 7.811873 (lr=1.7474e-04) (hash(x)=27224685) +262 train 8.112437 (lr=1.7474e-04) (hash(x)=28274477) +263 train 7.575011 (lr=1.7473e-04) (hash(x)=23557495) +264 train 7.679855 (lr=1.7473e-04) (hash(x)=24680596) +265 train 7.692327 (lr=1.7473e-04) (hash(x)=23928957) +266 train 7.668775 (lr=1.7473e-04) (hash(x)=23761390) +267 train 7.576411 (lr=1.7473e-04) (hash(x)=25288123) +268 train 7.837968 (lr=1.7472e-04) (hash(x)=28705502) +269 train 7.447624 (lr=1.7472e-04) (hash(x)=23246294) +270 train 7.527484 (lr=1.7472e-04) (hash(x)=28639079) +271 train 7.428257 (lr=1.7472e-04) (hash(x)=27804380) +272 train 7.653123 (lr=1.7471e-04) (hash(x)=24172235) +273 train 7.750426 (lr=1.7471e-04) (hash(x)=23089140) +274 train 7.955221 (lr=1.7471e-04) (hash(x)=27163701) +275 train 8.013991 (lr=1.7471e-04) (hash(x)=26993263) +276 train 7.823602 (lr=1.7471e-04) (hash(x)=28224233) +277 train 8.115489 (lr=1.7470e-04) (hash(x)=27397203) +278 train 8.001493 (lr=1.7470e-04) (hash(x)=27923882) +279 train 7.810876 (lr=1.7470e-04) (hash(x)=26654908) +280 train 7.735929 (lr=1.7470e-04) (hash(x)=24213147) +281 train 7.491553 (lr=1.7470e-04) (hash(x)=21965022) +282 train 7.622316 (lr=1.7469e-04) (hash(x)=25465685) +283 train 7.815414 (lr=1.7469e-04) (hash(x)=27347722) +284 train 7.808369 (lr=1.7469e-04) (hash(x)=26732050) +285 train 8.013652 (lr=1.7469e-04) (hash(x)=28314127) +286 train 7.627503 (lr=1.7468e-04) (hash(x)=21471186) +287 train 7.517757 (lr=1.7468e-04) (hash(x)=23627518) +288 train 7.471567 (lr=1.7468e-04) (hash(x)=20870353) +289 train 7.581824 (lr=1.7468e-04) (hash(x)=25024764) +290 train 7.380519 (lr=1.7468e-04) (hash(x)=20683822) +291 train 7.722206 (lr=1.7467e-04) (hash(x)=21768671) +292 train 7.708836 (lr=1.7467e-04) (hash(x)=25557309) +293 train 7.902594 (lr=1.7467e-04) (hash(x)=25076667) +294 train 7.531447 (lr=1.7467e-04) (hash(x)=23765822) +295 train 7.515642 (lr=1.7466e-04) (hash(x)=21889990) +296 train 7.730985 (lr=1.7466e-04) (hash(x)=26339893) +297 train 7.392798 (lr=1.7466e-04) (hash(x)=20932794) +298 train 7.572254 (lr=1.7466e-04) (hash(x)=21750070) +299 train 7.699207 (lr=1.7466e-04) (hash(x)=23665838) +300 val loss 7.6429 +300 val perplexity 2085.8425 +300 train 8.516079 (lr=1.7465e-04) (hash(x)=32888061) +301 train 8.288180 (lr=1.7465e-04) (hash(x)=30223582) +302 train 7.941082 (lr=1.7465e-04) (hash(x)=26908418) +303 train 7.212556 (lr=1.7465e-04) (hash(x)=22528001) +304 train 7.830842 (lr=1.7464e-04) (hash(x)=27452187) +305 train 7.669841 (lr=1.7464e-04) (hash(x)=25181641) +306 train 7.772883 (lr=1.7464e-04) (hash(x)=25546593) +307 train 7.830658 (lr=1.7464e-04) (hash(x)=22487328) +308 train 7.963051 (lr=1.7463e-04) (hash(x)=27804274) +309 train 7.965591 (lr=1.7463e-04) (hash(x)=26544630) +310 train 8.079451 (lr=1.7463e-04) (hash(x)=27738934) +311 train 7.853819 (lr=1.7463e-04) (hash(x)=29248942) +312 train 7.642883 (lr=1.7462e-04) (hash(x)=25103452) +313 train 7.887007 (lr=1.7462e-04) (hash(x)=25052066) +314 train 7.745298 (lr=1.7462e-04) (hash(x)=24481302) +315 train 7.720790 (lr=1.7462e-04) (hash(x)=23543273) +316 train 7.748628 (lr=1.7461e-04) (hash(x)=25608244) +317 train 7.914731 (lr=1.7461e-04) (hash(x)=27451288) +318 train 7.623667 (lr=1.7461e-04) (hash(x)=22806491) +319 train 7.724152 (lr=1.7461e-04) (hash(x)=25533417) +320 train 7.737788 (lr=1.7460e-04) (hash(x)=24557997) +321 train 7.771209 (lr=1.7460e-04) (hash(x)=24432899) +322 train 7.993737 (lr=1.7460e-04) (hash(x)=27583287) +323 train 7.918916 (lr=1.7460e-04) (hash(x)=25552036) +324 train 7.615454 (lr=1.7459e-04) (hash(x)=24201868) +325 train 7.903546 (lr=1.7459e-04) (hash(x)=28149782) +326 train 7.657488 (lr=1.7459e-04) (hash(x)=25529698) +327 train 7.353101 (lr=1.7459e-04) (hash(x)=20612533) +328 train 7.458944 (lr=1.7458e-04) (hash(x)=20699000) +329 train 7.370140 (lr=1.7458e-04) (hash(x)=19774173) +330 train 7.412444 (lr=1.7458e-04) (hash(x)=21681646) +331 train 7.251329 (lr=1.7458e-04) (hash(x)=20216795) +332 train 7.964858 (lr=1.7457e-04) (hash(x)=27697998) +333 train 7.706909 (lr=1.7457e-04) (hash(x)=25896435) +334 train 7.556771 (lr=1.7457e-04) (hash(x)=21585310) +335 train 7.607178 (lr=1.7457e-04) (hash(x)=24677740) +336 train 7.426884 (lr=1.7456e-04) (hash(x)=22027900) +337 train 7.454559 (lr=1.7456e-04) (hash(x)=21835643) +338 train 7.388040 (lr=1.7456e-04) (hash(x)=20558462) +339 train 7.276611 (lr=1.7456e-04) (hash(x)=16722715) +340 train 7.447326 (lr=1.7455e-04) (hash(x)=20972655) +341 train 7.911574 (lr=1.7455e-04) (hash(x)=26303975) +342 train 7.654630 (lr=1.7455e-04) (hash(x)=22938170) +343 train 7.709662 (lr=1.7455e-04) (hash(x)=25347203) +344 train 7.649480 (lr=1.7454e-04) (hash(x)=27398686) +345 train 7.655919 (lr=1.7454e-04) (hash(x)=25973417) +346 train 7.653415 (lr=1.7454e-04) (hash(x)=26918389) +347 train 7.625793 (lr=1.7454e-04) (hash(x)=24272489) +348 train 7.653507 (lr=1.7453e-04) (hash(x)=25593714) +349 train 7.730521 (lr=1.7453e-04) (hash(x)=29260846) +350 val loss 7.6372 +350 val perplexity 2073.8306 +350 train 7.795288 (lr=1.7453e-04) (hash(x)=27951602) +351 train 7.885916 (lr=1.7452e-04) (hash(x)=28922363) +352 train 7.774652 (lr=1.7452e-04) (hash(x)=27210734) +353 train 7.810730 (lr=1.7452e-04) (hash(x)=26322572) +354 train 7.663588 (lr=1.7452e-04) (hash(x)=27084665) +355 train 7.612375 (lr=1.7451e-04) (hash(x)=25510798) +356 train 7.701323 (lr=1.7451e-04) (hash(x)=24970921) +357 train 7.728298 (lr=1.7451e-04) (hash(x)=24138948) +358 train 7.620800 (lr=1.7451e-04) (hash(x)=24790211) +359 train 7.649292 (lr=1.7450e-04) (hash(x)=25631397) +360 train 7.522758 (lr=1.7450e-04) (hash(x)=23226625) +361 train 7.588192 (lr=1.7450e-04) (hash(x)=24001903) +362 train 7.584004 (lr=1.7449e-04) (hash(x)=24587948) +363 train 7.274430 (lr=1.7449e-04) (hash(x)=21333676) +364 train 7.155509 (lr=1.7449e-04) (hash(x)=23673779) +365 train 8.553187 (lr=1.7449e-04) (hash(x)=30770484) +366 train 7.720029 (lr=1.7448e-04) (hash(x)=26564899) +367 train 7.714358 (lr=1.7448e-04) (hash(x)=26237983) +368 train 7.435991 (lr=1.7448e-04) (hash(x)=23764356) +369 train 7.805808 (lr=1.7447e-04) (hash(x)=26205744) +370 train 7.478035 (lr=1.7447e-04) (hash(x)=19208770) +371 train 7.720394 (lr=1.7447e-04) (hash(x)=25976502) +372 train 7.576633 (lr=1.7447e-04) (hash(x)=23983933) +373 train 7.546113 (lr=1.7446e-04) (hash(x)=24080636) +374 train 7.654334 (lr=1.7446e-04) (hash(x)=24404047) +375 train 7.587448 (lr=1.7446e-04) (hash(x)=24742645) +376 train 7.679443 (lr=1.7445e-04) (hash(x)=24159600) +377 train 7.887161 (lr=1.7445e-04) (hash(x)=28677257) +378 train 7.616828 (lr=1.7445e-04) (hash(x)=25604111) +379 train 7.576842 (lr=1.7445e-04) (hash(x)=27086333) +380 train 7.539707 (lr=1.7444e-04) (hash(x)=25188207) +381 train 7.758823 (lr=1.7444e-04) (hash(x)=27855233) +382 train 7.351087 (lr=1.7444e-04) (hash(x)=19470039) +383 train 7.640946 (lr=1.7443e-04) (hash(x)=26157660) +384 train 7.587367 (lr=1.7443e-04) (hash(x)=25291570) +385 train 7.576439 (lr=1.7443e-04) (hash(x)=25046062) +386 train 7.820184 (lr=1.7442e-04) (hash(x)=27020337) +387 train 7.481259 (lr=1.7442e-04) (hash(x)=23616370) +388 train 7.161711 (lr=1.7442e-04) (hash(x)=19113218) +389 train 7.539506 (lr=1.7442e-04) (hash(x)=24302232) +390 train 7.518250 (lr=1.7441e-04) (hash(x)=22188949) +391 train 7.330171 (lr=1.7441e-04) (hash(x)=22582169) +392 train 7.592052 (lr=1.7441e-04) (hash(x)=24700570) +393 train 7.428636 (lr=1.7440e-04) (hash(x)=22773833) +394 train 7.279177 (lr=1.7440e-04) (hash(x)=21875928) +395 train 7.551633 (lr=1.7440e-04) (hash(x)=26233189) +396 train 7.456102 (lr=1.7439e-04) (hash(x)=24321467) +397 train 7.769784 (lr=1.7439e-04) (hash(x)=26431507) +398 train 7.796596 (lr=1.7439e-04) (hash(x)=28690877) +399 train 7.748239 (lr=1.7439e-04) (hash(x)=26431960) +400 val loss 7.6006 +400 val perplexity 1999.3451 +400 train 7.553566 (lr=1.7438e-04) (hash(x)=24580300) +401 train 7.559749 (lr=1.7438e-04) (hash(x)=25112360) +402 train 7.655788 (lr=1.7438e-04) (hash(x)=27597243) +403 train 8.132774 (lr=1.7437e-04) (hash(x)=30707498) +404 train 7.774739 (lr=1.7437e-04) (hash(x)=28485465) +405 train 7.442301 (lr=1.7437e-04) (hash(x)=22586447) +406 train 7.553408 (lr=1.7436e-04) (hash(x)=23175270) +407 train 7.646970 (lr=1.7436e-04) (hash(x)=25716176) +408 train 7.703323 (lr=1.7436e-04) (hash(x)=26861373) +409 train 7.778273 (lr=1.7435e-04) (hash(x)=25118971) +410 train 7.279932 (lr=1.7435e-04) (hash(x)=19829066) +411 train 7.449191 (lr=1.7435e-04) (hash(x)=26256420) +412 train 7.746890 (lr=1.7434e-04) (hash(x)=27796153) +413 train 7.476814 (lr=1.7434e-04) (hash(x)=22633318) +414 train 7.486262 (lr=1.7434e-04) (hash(x)=22589383) +415 train 7.908957 (lr=1.7433e-04) (hash(x)=28019788) +416 train 7.833005 (lr=1.7433e-04) (hash(x)=28970440) +417 train 7.531925 (lr=1.7433e-04) (hash(x)=27396089) +418 train 7.518622 (lr=1.7433e-04) (hash(x)=21183513) +419 train 7.578526 (lr=1.7432e-04) (hash(x)=23510110) +420 train 7.752895 (lr=1.7432e-04) (hash(x)=28833467) +421 train 7.582342 (lr=1.7432e-04) (hash(x)=23646926) +422 train 7.575220 (lr=1.7431e-04) (hash(x)=24697272) +423 train 7.342975 (lr=1.7431e-04) (hash(x)=20382963) +424 train 7.351684 (lr=1.7431e-04) (hash(x)=23467595) +425 train 7.532127 (lr=1.7430e-04) (hash(x)=24304768) +426 train 7.453154 (lr=1.7430e-04) (hash(x)=21392328) +427 train 7.467114 (lr=1.7430e-04) (hash(x)=25339466) +428 train 7.438719 (lr=1.7429e-04) (hash(x)=22092542) +429 train 7.547771 (lr=1.7429e-04) (hash(x)=22088696) +430 train 7.425775 (lr=1.7429e-04) (hash(x)=22184471) +431 train 7.507379 (lr=1.7428e-04) (hash(x)=24489647) +432 train 7.574052 (lr=1.7428e-04) (hash(x)=26794132) +433 train 7.334546 (lr=1.7428e-04) (hash(x)=22940357) +434 train 7.529318 (lr=1.7427e-04) (hash(x)=23719522) +435 train 7.396057 (lr=1.7427e-04) (hash(x)=22927699) +436 train 7.528749 (lr=1.7427e-04) (hash(x)=26068576) +437 train 7.667379 (lr=1.7426e-04) (hash(x)=27631132) +438 train 7.540792 (lr=1.7426e-04) (hash(x)=26739991) +439 train 7.645323 (lr=1.7426e-04) (hash(x)=25128502) +440 train 7.733915 (lr=1.7425e-04) (hash(x)=25657260) +441 train 7.431349 (lr=1.7425e-04) (hash(x)=23576982) +442 train 7.643265 (lr=1.7425e-04) (hash(x)=27117886) +443 train 7.636597 (lr=1.7424e-04) (hash(x)=25808969) +444 train 7.555326 (lr=1.7424e-04) (hash(x)=24738238) +445 train 7.543463 (lr=1.7423e-04) (hash(x)=23429962) +446 train 7.701154 (lr=1.7423e-04) (hash(x)=25075165) +447 train 7.518109 (lr=1.7423e-04) (hash(x)=25231390) +448 train 7.348240 (lr=1.7422e-04) (hash(x)=22055054) +449 train 7.570409 (lr=1.7422e-04) (hash(x)=25395441) +450 val loss 7.5571 +450 val perplexity 1914.2720 +450 train 7.622447 (lr=1.7422e-04) (hash(x)=25863209) +451 train 7.325107 (lr=1.7421e-04) (hash(x)=21154388) +452 train 7.289626 (lr=1.7421e-04) (hash(x)=21600876) +453 train 7.419891 (lr=1.7421e-04) (hash(x)=24278611) +454 train 7.304300 (lr=1.7420e-04) (hash(x)=23221720) +455 train 7.502678 (lr=1.7420e-04) (hash(x)=22708977) +456 train 8.143703 (lr=1.7420e-04) (hash(x)=23637758) +457 train 7.832823 (lr=1.7419e-04) (hash(x)=28228490) +458 train 7.798595 (lr=1.7419e-04) (hash(x)=28638071) +459 train 7.682745 (lr=1.7419e-04) (hash(x)=27258353) +460 train 7.686019 (lr=1.7418e-04) (hash(x)=26604728) +461 train 7.604051 (lr=1.7418e-04) (hash(x)=23252199) +462 train 7.669640 (lr=1.7418e-04) (hash(x)=26441427) +463 train 7.444358 (lr=1.7417e-04) (hash(x)=24364920) +464 train 7.569417 (lr=1.7417e-04) (hash(x)=25623792) +465 train 7.440802 (lr=1.7416e-04) (hash(x)=23283905) +466 train 7.851317 (lr=1.7416e-04) (hash(x)=26025267) +467 train 7.616397 (lr=1.7416e-04) (hash(x)=27243972) +468 train 7.985469 (lr=1.7415e-04) (hash(x)=30449945) +469 train 7.710962 (lr=1.7415e-04) (hash(x)=28113043) +470 train 7.485198 (lr=1.7415e-04) (hash(x)=25182521) +471 train 7.496022 (lr=1.7414e-04) (hash(x)=24932925) +472 train 7.322660 (lr=1.7414e-04) (hash(x)=20353098) +473 train 7.298418 (lr=1.7414e-04) (hash(x)=19001259) +474 train 7.865453 (lr=1.7413e-04) (hash(x)=27585685) +475 train 7.550072 (lr=1.7413e-04) (hash(x)=26371091) +476 train 7.407805 (lr=1.7412e-04) (hash(x)=24891798) +477 train 7.465149 (lr=1.7412e-04) (hash(x)=24258817) +478 train 7.520711 (lr=1.7412e-04) (hash(x)=24330263) +479 train 7.598073 (lr=1.7411e-04) (hash(x)=26913684) +480 train 7.606056 (lr=1.7411e-04) (hash(x)=26338455) +481 train 7.885242 (lr=1.7411e-04) (hash(x)=27753043) +482 train 7.542792 (lr=1.7410e-04) (hash(x)=26123289) +483 train 7.657524 (lr=1.7410e-04) (hash(x)=29239611) +484 train 7.589462 (lr=1.7409e-04) (hash(x)=26553003) +485 train 7.589851 (lr=1.7409e-04) (hash(x)=22984557) +486 train 7.106796 (lr=1.7409e-04) (hash(x)=16947491) +487 train 7.080177 (lr=1.7408e-04) (hash(x)=18017792) +488 train 7.238435 (lr=1.7408e-04) (hash(x)=19918608) +489 train 7.719379 (lr=1.7408e-04) (hash(x)=23374526) +490 train 7.567415 (lr=1.7407e-04) (hash(x)=25009505) +491 train 7.544042 (lr=1.7407e-04) (hash(x)=27574089) +492 train 7.711972 (lr=1.7406e-04) (hash(x)=24122664) +493 train 7.555321 (lr=1.7406e-04) (hash(x)=26154906) +494 train 7.486359 (lr=1.7406e-04) (hash(x)=25192767) +495 train 7.637563 (lr=1.7405e-04) (hash(x)=28613882) +496 train 7.545291 (lr=1.7405e-04) (hash(x)=23547219) +497 train 7.560543 (lr=1.7405e-04) (hash(x)=25272182) +498 train 7.415227 (lr=1.7404e-04) (hash(x)=24992761) +499 train 7.686630 (lr=1.7404e-04) (hash(x)=26981914) +500 val loss 7.5583 +500 val perplexity 1916.6321 +500 train 7.491047 (lr=1.7403e-04) (hash(x)=22051933) +501 train 7.662050 (lr=1.7403e-04) (hash(x)=24232348) +502 train 7.599288 (lr=1.7403e-04) (hash(x)=23158331) +503 train 7.464095 (lr=1.7402e-04) (hash(x)=22652243) +504 train 7.486315 (lr=1.7402e-04) (hash(x)=23805602) +505 train 7.783764 (lr=1.7401e-04) (hash(x)=25411991) +506 train 6.995913 (lr=1.7401e-04) (hash(x)=18827215) +507 train 6.693370 (lr=1.7401e-04) (hash(x)=15446025) +508 train 7.069777 (lr=1.7400e-04) (hash(x)=20516263) +509 train 7.646791 (lr=1.7400e-04) (hash(x)=27846176) +510 train 7.340229 (lr=1.7400e-04) (hash(x)=23342449) +511 train 7.615109 (lr=1.7399e-04) (hash(x)=27194521) +512 train 7.413400 (lr=1.7399e-04) (hash(x)=23008284) +513 train 7.902568 (lr=1.7398e-04) (hash(x)=29430001) +514 train 7.193265 (lr=1.7398e-04) (hash(x)=22579319) +515 train 7.241995 (lr=1.7398e-04) (hash(x)=25264518) +516 train 7.589450 (lr=1.7397e-04) (hash(x)=25359075) +517 train 7.560925 (lr=1.7397e-04) (hash(x)=25568956) +518 train 7.849724 (lr=1.7396e-04) (hash(x)=32004108) +519 train 7.477512 (lr=1.7396e-04) (hash(x)=24936836) +520 train 7.648629 (lr=1.7396e-04) (hash(x)=27263338) +521 train 7.696280 (lr=1.7395e-04) (hash(x)=27452099) +522 train 7.557938 (lr=1.7395e-04) (hash(x)=25965406) +523 train 7.736557 (lr=1.7394e-04) (hash(x)=28197282) +524 train 7.478039 (lr=1.7394e-04) (hash(x)=22466209) +525 train 7.495471 (lr=1.7394e-04) (hash(x)=22931889) +526 train 7.642963 (lr=1.7393e-04) (hash(x)=26903920) +527 train 7.506481 (lr=1.7393e-04) (hash(x)=24765578) +528 train 7.644804 (lr=1.7392e-04) (hash(x)=27811359) +529 train 7.396092 (lr=1.7392e-04) (hash(x)=25078649) +530 train 7.571931 (lr=1.7391e-04) (hash(x)=25572416) +531 train 7.736364 (lr=1.7391e-04) (hash(x)=27448185) +532 train 7.741216 (lr=1.7391e-04) (hash(x)=25923719) +533 train 7.539249 (lr=1.7390e-04) (hash(x)=24804856) +534 train 7.646930 (lr=1.7390e-04) (hash(x)=23207829) +535 train 7.521163 (lr=1.7389e-04) (hash(x)=23107416) +536 train 7.402254 (lr=1.7389e-04) (hash(x)=26739531) +537 train 7.418138 (lr=1.7389e-04) (hash(x)=24960796) +538 train 7.534999 (lr=1.7388e-04) (hash(x)=24667802) +539 train 7.637517 (lr=1.7388e-04) (hash(x)=26755138) +540 train 7.537213 (lr=1.7387e-04) (hash(x)=25537132) +541 train 7.478016 (lr=1.7387e-04) (hash(x)=24542526) +542 train 7.230060 (lr=1.7387e-04) (hash(x)=21296355) +543 train 7.799911 (lr=1.7386e-04) (hash(x)=29314255) +544 train 7.527037 (lr=1.7386e-04) (hash(x)=26001799) +545 train 7.564829 (lr=1.7385e-04) (hash(x)=27347755) +546 train 7.570212 (lr=1.7385e-04) (hash(x)=25107798) +547 train 7.417750 (lr=1.7384e-04) (hash(x)=22112669) +548 train 7.460186 (lr=1.7384e-04) (hash(x)=21897967) +549 train 7.567720 (lr=1.7384e-04) (hash(x)=25161929) +550 val loss 7.5284 +550 val perplexity 1860.1437 +550 train 7.430411 (lr=1.7383e-04) (hash(x)=27465106) +551 train 7.546826 (lr=1.7383e-04) (hash(x)=24013079) +552 train 7.406374 (lr=1.7382e-04) (hash(x)=23142015) +553 train 7.510686 (lr=1.7382e-04) (hash(x)=26768629) +554 train 7.524379 (lr=1.7381e-04) (hash(x)=26393383) +555 train 7.365048 (lr=1.7381e-04) (hash(x)=22537194) +556 train 7.626203 (lr=1.7381e-04) (hash(x)=24046036) +557 train 7.595754 (lr=1.7380e-04) (hash(x)=24974360) +558 train 7.807181 (lr=1.7380e-04) (hash(x)=28379928) +559 train 7.510521 (lr=1.7379e-04) (hash(x)=25322001) +560 train 7.619294 (lr=1.7379e-04) (hash(x)=26622031) +561 train 7.292791 (lr=1.7378e-04) (hash(x)=20562247) +562 train 7.663509 (lr=1.7378e-04) (hash(x)=27381885) +563 train 7.795445 (lr=1.7378e-04) (hash(x)=27028126) +564 train 7.638288 (lr=1.7377e-04) (hash(x)=28882928) +565 train 7.562164 (lr=1.7377e-04) (hash(x)=25666355) +566 train 7.665579 (lr=1.7376e-04) (hash(x)=24330810) +567 train 7.578109 (lr=1.7376e-04) (hash(x)=26690440) +568 train 7.455680 (lr=1.7375e-04) (hash(x)=22923592) +569 train 7.542317 (lr=1.7375e-04) (hash(x)=27348418) +570 train 7.600000 (lr=1.7374e-04) (hash(x)=28849848) +571 train 7.643384 (lr=1.7374e-04) (hash(x)=26967331) +572 train 7.408121 (lr=1.7374e-04) (hash(x)=22831467) +573 train 7.476360 (lr=1.7373e-04) (hash(x)=24765121) +574 train 7.447816 (lr=1.7373e-04) (hash(x)=24331857) +575 train 7.282009 (lr=1.7372e-04) (hash(x)=22598512) +576 train 7.466237 (lr=1.7372e-04) (hash(x)=25149353) +577 train 7.357207 (lr=1.7371e-04) (hash(x)=23725598) +578 train 7.557891 (lr=1.7371e-04) (hash(x)=26449557) +579 train 7.628087 (lr=1.7371e-04) (hash(x)=24697985) +580 train 7.625739 (lr=1.7370e-04) (hash(x)=26923059) +581 train 7.441399 (lr=1.7370e-04) (hash(x)=25201962) +582 train 7.089180 (lr=1.7369e-04) (hash(x)=20931520) +583 train 7.185483 (lr=1.7369e-04) (hash(x)=18473911) +584 train 7.312924 (lr=1.7368e-04) (hash(x)=21306267) +585 train 7.561831 (lr=1.7368e-04) (hash(x)=25982840) +586 train 7.436995 (lr=1.7367e-04) (hash(x)=25364874) +587 train 7.345181 (lr=1.7367e-04) (hash(x)=23172124) +588 train 7.655729 (lr=1.7366e-04) (hash(x)=27876897) +589 train 8.351913 (lr=1.7366e-04) (hash(x)=34646114) +590 train 8.699298 (lr=1.7366e-04) (hash(x)=35153576) +591 train 7.482562 (lr=1.7365e-04) (hash(x)=22322442) +592 train 7.679793 (lr=1.7365e-04) (hash(x)=27907331) +593 train 7.585308 (lr=1.7364e-04) (hash(x)=26211794) +594 train 7.798825 (lr=1.7364e-04) (hash(x)=29291512) +595 train 8.017406 (lr=1.7363e-04) (hash(x)=29659121) +596 train 7.863708 (lr=1.7363e-04) (hash(x)=29674399) +597 train 7.535595 (lr=1.7362e-04) (hash(x)=23538306) +598 train 7.654556 (lr=1.7362e-04) (hash(x)=21991524) +599 train 7.585126 (lr=1.7361e-04) (hash(x)=26324153) +600 val loss 7.5320 +600 val perplexity 1866.8320 +600 train 7.503036 (lr=1.7361e-04) (hash(x)=23712082) +601 train 7.565921 (lr=1.7360e-04) (hash(x)=24910403) +602 train 7.520542 (lr=1.7360e-04) (hash(x)=26737205) +603 train 7.621850 (lr=1.7360e-04) (hash(x)=26939970) +604 train 7.504177 (lr=1.7359e-04) (hash(x)=27651943) +605 train 7.845799 (lr=1.7359e-04) (hash(x)=27515446) +606 train 7.742703 (lr=1.7358e-04) (hash(x)=26753129) +607 train 7.386687 (lr=1.7358e-04) (hash(x)=23446058) +608 train 7.647676 (lr=1.7357e-04) (hash(x)=27587849) +609 train 7.584589 (lr=1.7357e-04) (hash(x)=25308253) +610 train 7.624557 (lr=1.7356e-04) (hash(x)=26615098) +611 train 7.700421 (lr=1.7356e-04) (hash(x)=29981801) +612 train 7.733836 (lr=1.7355e-04) (hash(x)=29592345) +613 train 7.733566 (lr=1.7355e-04) (hash(x)=23470413) +614 train 7.627326 (lr=1.7354e-04) (hash(x)=24742370) +615 train 7.580044 (lr=1.7354e-04) (hash(x)=24843741) +616 train 7.507389 (lr=1.7353e-04) (hash(x)=25192548) +617 train 7.581398 (lr=1.7353e-04) (hash(x)=27176996) +618 train 7.408834 (lr=1.7352e-04) (hash(x)=23964552) +619 train 7.405167 (lr=1.7352e-04) (hash(x)=22855363) +620 train 7.397290 (lr=1.7352e-04) (hash(x)=26332996) +621 train 7.222443 (lr=1.7351e-04) (hash(x)=22960957) +622 train 7.589858 (lr=1.7351e-04) (hash(x)=22752597) +623 train 7.497939 (lr=1.7350e-04) (hash(x)=23197102) +624 train 8.034548 (lr=1.7350e-04) (hash(x)=27383319) +625 train 7.491621 (lr=1.7349e-04) (hash(x)=26132276) +626 train 7.378711 (lr=1.7349e-04) (hash(x)=19810497) +627 train 7.469108 (lr=1.7348e-04) (hash(x)=25704919) +628 train 7.647825 (lr=1.7348e-04) (hash(x)=27174264) +629 train 7.749819 (lr=1.7347e-04) (hash(x)=22280814) +630 train 8.506136 (lr=1.7347e-04) (hash(x)=24279448) +631 train 7.956941 (lr=1.7346e-04) (hash(x)=23054940) +632 train 8.061400 (lr=1.7346e-04) (hash(x)=23942400) +633 train 8.320475 (lr=1.7345e-04) (hash(x)=24712416) +634 train 7.862144 (lr=1.7345e-04) (hash(x)=24564658) +635 train 7.566182 (lr=1.7344e-04) (hash(x)=24909904) +636 train 7.637791 (lr=1.7344e-04) (hash(x)=23049534) +637 train 7.672598 (lr=1.7343e-04) (hash(x)=24321591) +638 train 7.479599 (lr=1.7343e-04) (hash(x)=26153298) +639 train 7.495813 (lr=1.7342e-04) (hash(x)=27140757) +640 train 7.288542 (lr=1.7342e-04) (hash(x)=25115907) +641 train 7.333669 (lr=1.7341e-04) (hash(x)=26563770) +642 train 7.473837 (lr=1.7341e-04) (hash(x)=28089252) +643 train 7.411179 (lr=1.7340e-04) (hash(x)=25993110) +644 train 7.405826 (lr=1.7340e-04) (hash(x)=25150008) +645 train 7.682908 (lr=1.7339e-04) (hash(x)=28520222) +646 train 7.341737 (lr=1.7339e-04) (hash(x)=21349943) +647 train 7.422746 (lr=1.7338e-04) (hash(x)=25149419) +648 train 7.673110 (lr=1.7338e-04) (hash(x)=25730641) +649 train 7.807018 (lr=1.7337e-04) (hash(x)=26112813) +650 val loss 7.5422 +650 val perplexity 1886.0009 +650 train 7.590981 (lr=1.7337e-04) (hash(x)=25907805) +651 train 7.620588 (lr=1.7336e-04) (hash(x)=27623643) +652 train 7.536258 (lr=1.7336e-04) (hash(x)=26484959) +653 train 7.573206 (lr=1.7335e-04) (hash(x)=29199854) +654 train 7.557233 (lr=1.7335e-04) (hash(x)=28369628) +655 train 7.403890 (lr=1.7334e-04) (hash(x)=24727764) +656 train 7.124716 (lr=1.7334e-04) (hash(x)=22610673) +657 train 7.079892 (lr=1.7333e-04) (hash(x)=22667179) +658 train 6.907544 (lr=1.7333e-04) (hash(x)=18477300) +659 train 7.343370 (lr=1.7332e-04) (hash(x)=23155773) +660 train 7.160665 (lr=1.7332e-04) (hash(x)=19461032) +661 train 7.472562 (lr=1.7331e-04) (hash(x)=23453788) +662 train 7.572008 (lr=1.7331e-04) (hash(x)=24543466) +663 train 7.321659 (lr=1.7330e-04) (hash(x)=21935931) +664 train 7.144660 (lr=1.7330e-04) (hash(x)=19910292) +665 train 7.459741 (lr=1.7329e-04) (hash(x)=24481079) +666 train 7.156796 (lr=1.7329e-04) (hash(x)=18922411) +667 train 7.162258 (lr=1.7328e-04) (hash(x)=20054917) +668 train 7.415921 (lr=1.7328e-04) (hash(x)=24850470) +669 train 7.379200 (lr=1.7327e-04) (hash(x)=25907741) +670 train 7.556645 (lr=1.7327e-04) (hash(x)=26873522) +671 train 7.601387 (lr=1.7326e-04) (hash(x)=27606073) +672 train 7.747165 (lr=1.7326e-04) (hash(x)=26209645) +673 train 7.511827 (lr=1.7325e-04) (hash(x)=25202001) +674 train 7.578786 (lr=1.7325e-04) (hash(x)=25569462) +675 train 7.547596 (lr=1.7324e-04) (hash(x)=26534487) +676 train 7.483856 (lr=1.7324e-04) (hash(x)=26455057) +677 train 7.378989 (lr=1.7323e-04) (hash(x)=24095850) +678 train 7.627275 (lr=1.7323e-04) (hash(x)=25287752) +679 train 7.145816 (lr=1.7322e-04) (hash(x)=22450341) +680 train 7.849328 (lr=1.7321e-04) (hash(x)=29004853) +681 train 7.630689 (lr=1.7321e-04) (hash(x)=27993763) +682 train 7.411548 (lr=1.7320e-04) (hash(x)=26382658) +683 train 7.563086 (lr=1.7320e-04) (hash(x)=25013073) +684 train 7.579036 (lr=1.7319e-04) (hash(x)=30595809) +685 train 7.678876 (lr=1.7319e-04) (hash(x)=30934371) +686 train 8.252087 (lr=1.7318e-04) (hash(x)=33060834) +687 train 7.487601 (lr=1.7318e-04) (hash(x)=25945859) +688 train 7.323802 (lr=1.7317e-04) (hash(x)=23375678) +689 train 7.366932 (lr=1.7317e-04) (hash(x)=25218689) +690 train 7.447595 (lr=1.7316e-04) (hash(x)=28127397) +691 train 7.405389 (lr=1.7316e-04) (hash(x)=24418091) +692 train 7.366332 (lr=1.7315e-04) (hash(x)=22761099) +693 train 7.346985 (lr=1.7315e-04) (hash(x)=24615466) +694 train 7.487827 (lr=1.7314e-04) (hash(x)=24699240) +695 train 7.410272 (lr=1.7314e-04) (hash(x)=21613707) +696 train 7.442729 (lr=1.7313e-04) (hash(x)=24977554) +697 train 7.403676 (lr=1.7312e-04) (hash(x)=24348175) +698 train 7.588467 (lr=1.7312e-04) (hash(x)=25102767) +699 train 7.569154 (lr=1.7311e-04) (hash(x)=26386157) +700 val loss 7.4429 +700 val perplexity 1707.6249 +700 train 7.460927 (lr=1.7311e-04) (hash(x)=26423460) +701 train 7.417915 (lr=1.7310e-04) (hash(x)=25771047) +702 train 7.473680 (lr=1.7310e-04) (hash(x)=26999875) +703 train 7.397762 (lr=1.7309e-04) (hash(x)=24396519) +704 train 7.410364 (lr=1.7309e-04) (hash(x)=22588122) +705 train 7.748529 (lr=1.7308e-04) (hash(x)=25142399) +706 train 7.520061 (lr=1.7308e-04) (hash(x)=20440214) +707 train 7.369156 (lr=1.7307e-04) (hash(x)=23265507) +708 train 7.437582 (lr=1.7307e-04) (hash(x)=24563470) +709 train 7.343443 (lr=1.7306e-04) (hash(x)=22514858) +710 train 7.672957 (lr=1.7305e-04) (hash(x)=26691212) +711 train 7.742537 (lr=1.7305e-04) (hash(x)=29138828) +712 train 7.741755 (lr=1.7304e-04) (hash(x)=28028528) +713 train 7.578784 (lr=1.7304e-04) (hash(x)=20531210) +714 train 7.469285 (lr=1.7303e-04) (hash(x)=25075352) +715 train 7.504518 (lr=1.7303e-04) (hash(x)=24265353) +716 train 7.601104 (lr=1.7302e-04) (hash(x)=24635726) +717 train 7.468804 (lr=1.7302e-04) (hash(x)=24999726) +718 train 7.605103 (lr=1.7301e-04) (hash(x)=27412910) +719 train 7.384634 (lr=1.7300e-04) (hash(x)=24685515) +720 train 7.433606 (lr=1.7300e-04) (hash(x)=23780329) +721 train 7.278142 (lr=1.7299e-04) (hash(x)=25071701) +722 train 7.445471 (lr=1.7299e-04) (hash(x)=23767130) +723 train 7.384529 (lr=1.7298e-04) (hash(x)=24876269) +724 train 7.529788 (lr=1.7298e-04) (hash(x)=26405773) +725 train 7.966467 (lr=1.7297e-04) (hash(x)=31733180) +726 train 7.109746 (lr=1.7297e-04) (hash(x)=21337509) +727 train 7.314444 (lr=1.7296e-04) (hash(x)=22825749) +728 train 7.638598 (lr=1.7295e-04) (hash(x)=28638695) +729 train 7.501904 (lr=1.7295e-04) (hash(x)=26393943) +730 train 7.658429 (lr=1.7294e-04) (hash(x)=27563583) +731 train 7.163854 (lr=1.7294e-04) (hash(x)=21239652) +732 train 7.284845 (lr=1.7293e-04) (hash(x)=23986428) +733 train 7.260571 (lr=1.7293e-04) (hash(x)=24943881) +734 train 7.749829 (lr=1.7292e-04) (hash(x)=29691448) +735 train 7.688746 (lr=1.7292e-04) (hash(x)=28767869) +736 train 7.396689 (lr=1.7291e-04) (hash(x)=23628188) +737 train 7.691718 (lr=1.7290e-04) (hash(x)=29341482) +738 train 7.528356 (lr=1.7290e-04) (hash(x)=30336570) +739 train 7.495988 (lr=1.7289e-04) (hash(x)=25614301) +740 train 7.342590 (lr=1.7289e-04) (hash(x)=24160500) +741 train 7.572826 (lr=1.7288e-04) (hash(x)=26030058) +742 train 7.962368 (lr=1.7288e-04) (hash(x)=29243936) +743 train 7.251953 (lr=1.7287e-04) (hash(x)=21159060) +744 train 7.350572 (lr=1.7286e-04) (hash(x)=23701853) +745 train 7.536485 (lr=1.7286e-04) (hash(x)=24629937) +746 train 7.451332 (lr=1.7285e-04) (hash(x)=25110108) +747 train 7.532421 (lr=1.7285e-04) (hash(x)=26751788) +748 train 7.558176 (lr=1.7284e-04) (hash(x)=26430427) +749 train 7.415695 (lr=1.7284e-04) (hash(x)=26012353) +750 val loss 7.4425 +750 val perplexity 1707.0411 +750 train 7.547369 (lr=1.7283e-04) (hash(x)=22735910) +751 train 7.353456 (lr=1.7282e-04) (hash(x)=25045397) +752 train 7.085124 (lr=1.7282e-04) (hash(x)=21554427) +753 train 7.180463 (lr=1.7281e-04) (hash(x)=23751143) +754 train 7.918900 (lr=1.7281e-04) (hash(x)=28602273) +755 train 7.992921 (lr=1.7280e-04) (hash(x)=29989709) +756 train 7.326936 (lr=1.7279e-04) (hash(x)=22331648) +757 train 7.777967 (lr=1.7279e-04) (hash(x)=31017246) +758 train 7.741321 (lr=1.7278e-04) (hash(x)=29709045) +759 train 7.785671 (lr=1.7278e-04) (hash(x)=25560928) +760 train 7.443559 (lr=1.7277e-04) (hash(x)=25075464) +761 train 7.522632 (lr=1.7277e-04) (hash(x)=27352253) +762 train 7.722389 (lr=1.7276e-04) (hash(x)=28187891) +763 train 7.589462 (lr=1.7275e-04) (hash(x)=26062687) +764 train 7.606270 (lr=1.7275e-04) (hash(x)=27427811) +765 train 7.674103 (lr=1.7274e-04) (hash(x)=27614522) +766 train 7.443927 (lr=1.7274e-04) (hash(x)=26129544) +767 train 8.021016 (lr=1.7273e-04) (hash(x)=28959222) +768 train 7.551888 (lr=1.7272e-04) (hash(x)=26860067) +769 train 7.325565 (lr=1.7272e-04) (hash(x)=25122598) +770 train 7.411251 (lr=1.7271e-04) (hash(x)=25245030) +771 train 7.432627 (lr=1.7271e-04) (hash(x)=25434884) +772 train 7.476860 (lr=1.7270e-04) (hash(x)=27732790) +773 train 7.530504 (lr=1.7269e-04) (hash(x)=27824438) +774 train 7.597169 (lr=1.7269e-04) (hash(x)=27201953) +775 train 7.306684 (lr=1.7268e-04) (hash(x)=21248405) +776 train 7.112946 (lr=1.7268e-04) (hash(x)=22805934) +777 train 7.465209 (lr=1.7267e-04) (hash(x)=26482588) +778 train 7.525830 (lr=1.7266e-04) (hash(x)=24153691) +779 train 7.659496 (lr=1.7266e-04) (hash(x)=25044192) +780 train 7.590161 (lr=1.7265e-04) (hash(x)=25910078) +781 train 7.607973 (lr=1.7265e-04) (hash(x)=28645524) +782 train 7.383944 (lr=1.7264e-04) (hash(x)=24368498) +783 train 7.450169 (lr=1.7263e-04) (hash(x)=25830182) +784 train 7.548956 (lr=1.7263e-04) (hash(x)=29181807) +785 train 7.485994 (lr=1.7262e-04) (hash(x)=25585137) +786 train 7.429746 (lr=1.7262e-04) (hash(x)=24798246) +787 train 7.589588 (lr=1.7261e-04) (hash(x)=26621419) +788 train 7.155810 (lr=1.7260e-04) (hash(x)=21446891) +789 train 7.043518 (lr=1.7260e-04) (hash(x)=22165286) +790 train 7.249327 (lr=1.7259e-04) (hash(x)=23477219) +791 train 7.528397 (lr=1.7259e-04) (hash(x)=25173113) +792 train 7.425717 (lr=1.7258e-04) (hash(x)=25853788) +793 train 7.541417 (lr=1.7257e-04) (hash(x)=27267091) +794 train 7.365044 (lr=1.7257e-04) (hash(x)=23743694) +795 train 7.308537 (lr=1.7256e-04) (hash(x)=24400133) +796 train 7.436267 (lr=1.7256e-04) (hash(x)=23663639) +797 train 7.270186 (lr=1.7255e-04) (hash(x)=23103223) +798 train 7.831042 (lr=1.7254e-04) (hash(x)=28748411) +799 train 7.067379 (lr=1.7254e-04) (hash(x)=23486277) +800 val loss 7.4012 +800 val perplexity 1638.0250 +800 train 7.437694 (lr=1.7253e-04) (hash(x)=25678518) +801 train 7.340000 (lr=1.7253e-04) (hash(x)=23421286) +802 train 7.469672 (lr=1.7252e-04) (hash(x)=26054104) +803 train 7.477445 (lr=1.7251e-04) (hash(x)=25978130) +804 train 7.514594 (lr=1.7251e-04) (hash(x)=26006525) +805 train 7.469439 (lr=1.7250e-04) (hash(x)=25769432) +806 train 7.328386 (lr=1.7249e-04) (hash(x)=22430795) +807 train 7.638425 (lr=1.7249e-04) (hash(x)=28916006) +808 train 7.431887 (lr=1.7248e-04) (hash(x)=25166800) +809 train 7.535104 (lr=1.7248e-04) (hash(x)=24226056) +810 train 7.405067 (lr=1.7247e-04) (hash(x)=25057934) +811 train 8.260428 (lr=1.7246e-04) (hash(x)=33195100) +812 train 7.578388 (lr=1.7246e-04) (hash(x)=26312888) +813 train 7.786307 (lr=1.7245e-04) (hash(x)=27730410) +814 train 7.653440 (lr=1.7244e-04) (hash(x)=27372474) +815 train 7.475751 (lr=1.7244e-04) (hash(x)=25556929) +816 train 7.543768 (lr=1.7243e-04) (hash(x)=26909985) +817 train 7.356500 (lr=1.7243e-04) (hash(x)=25991247) +818 train 7.507844 (lr=1.7242e-04) (hash(x)=27438141) +819 train 7.648247 (lr=1.7241e-04) (hash(x)=29536986) +820 train 7.410089 (lr=1.7241e-04) (hash(x)=24478391) +821 train 7.420381 (lr=1.7240e-04) (hash(x)=26125216) +822 train 7.468386 (lr=1.7239e-04) (hash(x)=26422130) +823 train 7.716223 (lr=1.7239e-04) (hash(x)=29648798) +824 train 7.332265 (lr=1.7238e-04) (hash(x)=21247770) +825 train 7.459490 (lr=1.7238e-04) (hash(x)=23195388) +826 train 7.400462 (lr=1.7237e-04) (hash(x)=25796725) +827 train 7.432698 (lr=1.7236e-04) (hash(x)=23124767) +828 train 7.493410 (lr=1.7236e-04) (hash(x)=25233464) +829 train 7.468573 (lr=1.7235e-04) (hash(x)=25713275) +830 train 7.407988 (lr=1.7234e-04) (hash(x)=25550167) +831 train 7.318481 (lr=1.7234e-04) (hash(x)=24976217) +832 train 7.641346 (lr=1.7233e-04) (hash(x)=28536827) +833 train 7.503920 (lr=1.7232e-04) (hash(x)=27500801) +834 train 7.365631 (lr=1.7232e-04) (hash(x)=25545765) +835 train 7.369522 (lr=1.7231e-04) (hash(x)=23632825) +836 train 7.408049 (lr=1.7231e-04) (hash(x)=25708009) +837 train 7.468597 (lr=1.7230e-04) (hash(x)=24456276) +838 train 7.590183 (lr=1.7229e-04) (hash(x)=29189855) +839 train 7.819975 (lr=1.7229e-04) (hash(x)=31019606) +840 train 7.736539 (lr=1.7228e-04) (hash(x)=26328013) +841 train 7.625509 (lr=1.7227e-04) (hash(x)=25027904) +842 train 7.385633 (lr=1.7227e-04) (hash(x)=23734189) +843 train 7.614815 (lr=1.7226e-04) (hash(x)=28236580) +844 train 7.427223 (lr=1.7225e-04) (hash(x)=26509780) +845 train 7.498210 (lr=1.7225e-04) (hash(x)=25386473) +846 train 7.411026 (lr=1.7224e-04) (hash(x)=24052671) +847 train 7.623950 (lr=1.7223e-04) (hash(x)=28269421) +848 train 7.068606 (lr=1.7223e-04) (hash(x)=22251724) +849 train 7.268853 (lr=1.7222e-04) (hash(x)=24308447) +850 val loss 7.3959 +850 val perplexity 1629.3531 +850 train 7.238973 (lr=1.7221e-04) (hash(x)=24242830) +851 train 7.434433 (lr=1.7221e-04) (hash(x)=25563279) +852 train 7.457991 (lr=1.7220e-04) (hash(x)=26354481) +853 train 7.608778 (lr=1.7220e-04) (hash(x)=26152637) +854 train 7.636075 (lr=1.7219e-04) (hash(x)=28051025) +855 train 7.481891 (lr=1.7218e-04) (hash(x)=24865358) +856 train 7.351685 (lr=1.7218e-04) (hash(x)=24288911) +857 train 7.271910 (lr=1.7217e-04) (hash(x)=22230964) +858 train 7.158313 (lr=1.7216e-04) (hash(x)=21303832) +859 train 7.290369 (lr=1.7216e-04) (hash(x)=22155546) +860 train 7.380185 (lr=1.7215e-04) (hash(x)=25296428) +861 train 7.559322 (lr=1.7214e-04) (hash(x)=29142319) +862 train 7.422871 (lr=1.7214e-04) (hash(x)=25545430) +863 train 7.237175 (lr=1.7213e-04) (hash(x)=26984272) +864 train 7.416353 (lr=1.7212e-04) (hash(x)=25429005) +865 train 7.464957 (lr=1.7212e-04) (hash(x)=27077032) +866 train 7.458102 (lr=1.7211e-04) (hash(x)=26494424) +867 train 7.518829 (lr=1.7210e-04) (hash(x)=23193673) +868 train 7.485367 (lr=1.7210e-04) (hash(x)=25075134) +869 train 7.534297 (lr=1.7209e-04) (hash(x)=27112558) +870 train 7.680614 (lr=1.7208e-04) (hash(x)=27436608) +871 train 7.388448 (lr=1.7208e-04) (hash(x)=24544116) +872 train 7.734698 (lr=1.7207e-04) (hash(x)=31632686) +873 train 7.418986 (lr=1.7206e-04) (hash(x)=25890184) +874 train 7.511102 (lr=1.7206e-04) (hash(x)=22887555) +875 train 7.354283 (lr=1.7205e-04) (hash(x)=24547533) +876 train 7.507053 (lr=1.7204e-04) (hash(x)=26553496) +877 train 7.584329 (lr=1.7204e-04) (hash(x)=27467688) +878 train 7.338591 (lr=1.7203e-04) (hash(x)=24766934) +879 train 7.224267 (lr=1.7202e-04) (hash(x)=22059850) +880 train 7.618631 (lr=1.7202e-04) (hash(x)=22871702) +881 train 7.432559 (lr=1.7201e-04) (hash(x)=23893130) +882 train 7.491089 (lr=1.7200e-04) (hash(x)=25125691) +883 train 7.433243 (lr=1.7200e-04) (hash(x)=25994573) +884 train 7.467024 (lr=1.7199e-04) (hash(x)=26076345) +885 train 7.421118 (lr=1.7198e-04) (hash(x)=26577783) +886 train 7.552625 (lr=1.7198e-04) (hash(x)=27395225) +887 train 7.388032 (lr=1.7197e-04) (hash(x)=23926632) +888 train 7.227498 (lr=1.7196e-04) (hash(x)=21737239) +889 train 7.495122 (lr=1.7195e-04) (hash(x)=23574207) +890 train 7.204813 (lr=1.7195e-04) (hash(x)=24365231) +891 train 7.354857 (lr=1.7194e-04) (hash(x)=27111369) +892 train 7.632646 (lr=1.7193e-04) (hash(x)=27290015) +893 train 7.379998 (lr=1.7193e-04) (hash(x)=23979820) +894 train 7.495746 (lr=1.7192e-04) (hash(x)=26450121) +895 train 7.396114 (lr=1.7191e-04) (hash(x)=27025333) +896 train 7.386922 (lr=1.7191e-04) (hash(x)=23624605) +897 train 7.191288 (lr=1.7190e-04) (hash(x)=22846386) +898 train 7.285307 (lr=1.7189e-04) (hash(x)=22970561) +899 train 7.136703 (lr=1.7189e-04) (hash(x)=16908068) +900 val loss 7.3899 +900 val perplexity 1619.5275 +900 train 7.346834 (lr=1.7188e-04) (hash(x)=24661446) +901 train 7.495481 (lr=1.7187e-04) (hash(x)=25664727) +902 train 7.427517 (lr=1.7187e-04) (hash(x)=25667011) +903 train 7.468562 (lr=1.7186e-04) (hash(x)=29120407) +904 train 7.557970 (lr=1.7185e-04) (hash(x)=23385735) +905 train 7.596091 (lr=1.7184e-04) (hash(x)=25564213) +906 train 7.645246 (lr=1.7184e-04) (hash(x)=25413898) +907 train 7.583778 (lr=1.7183e-04) (hash(x)=27092710) +908 train 7.358478 (lr=1.7182e-04) (hash(x)=25789923) +909 train 7.461766 (lr=1.7182e-04) (hash(x)=28533197) +910 train 7.273321 (lr=1.7181e-04) (hash(x)=22982996) +911 train 7.386063 (lr=1.7180e-04) (hash(x)=23827393) +912 train 7.033237 (lr=1.7180e-04) (hash(x)=21242640) +913 train 7.417636 (lr=1.7179e-04) (hash(x)=24154233) +914 train 7.447549 (lr=1.7178e-04) (hash(x)=24331967) +915 train 7.745840 (lr=1.7178e-04) (hash(x)=32812727) +916 train 7.320339 (lr=1.7177e-04) (hash(x)=23572994) +917 train 7.336129 (lr=1.7176e-04) (hash(x)=26305435) +918 train 7.396671 (lr=1.7175e-04) (hash(x)=26268355) +919 train 7.550912 (lr=1.7175e-04) (hash(x)=27230027) +920 train 7.334062 (lr=1.7174e-04) (hash(x)=23885377) +921 train 7.270705 (lr=1.7173e-04) (hash(x)=23532437) +922 train 7.372217 (lr=1.7173e-04) (hash(x)=25577034) +923 train 7.520888 (lr=1.7172e-04) (hash(x)=25703381) +924 train 7.484300 (lr=1.7171e-04) (hash(x)=27113866) +925 train 7.339252 (lr=1.7170e-04) (hash(x)=26961429) +926 train 7.177138 (lr=1.7170e-04) (hash(x)=21355372) +927 train 7.283957 (lr=1.7169e-04) (hash(x)=24968260) +928 train 7.271898 (lr=1.7168e-04) (hash(x)=25357517) +929 train 7.393138 (lr=1.7168e-04) (hash(x)=24854265) +930 train 7.158477 (lr=1.7167e-04) (hash(x)=21102770) +931 train 7.445956 (lr=1.7166e-04) (hash(x)=25676468) +932 train 7.280006 (lr=1.7165e-04) (hash(x)=22809869) +933 train 7.376547 (lr=1.7165e-04) (hash(x)=25503865) +934 train 7.282083 (lr=1.7164e-04) (hash(x)=24853995) +935 train 7.485017 (lr=1.7163e-04) (hash(x)=27544803) +936 train 7.541898 (lr=1.7163e-04) (hash(x)=25981933) +937 train 7.248161 (lr=1.7162e-04) (hash(x)=24658683) +938 train 7.418201 (lr=1.7161e-04) (hash(x)=23855201) +939 train 7.345225 (lr=1.7160e-04) (hash(x)=24331407) +940 train 7.563238 (lr=1.7160e-04) (hash(x)=29265551) +941 train 7.282538 (lr=1.7159e-04) (hash(x)=21892556) +942 train 7.337181 (lr=1.7158e-04) (hash(x)=27183405) +943 train 7.304929 (lr=1.7158e-04) (hash(x)=26540663) +944 train 7.250268 (lr=1.7157e-04) (hash(x)=25718393) +945 train 7.416306 (lr=1.7156e-04) (hash(x)=26819462) +946 train 7.382411 (lr=1.7155e-04) (hash(x)=27427540) +947 train 7.368616 (lr=1.7155e-04) (hash(x)=25532657) +948 train 7.629161 (lr=1.7154e-04) (hash(x)=27641372) +949 train 7.304125 (lr=1.7153e-04) (hash(x)=26515570) +950 val loss 7.3457 +950 val perplexity 1549.5625 +950 train 7.560983 (lr=1.7153e-04) (hash(x)=26911957) +951 train 7.770375 (lr=1.7152e-04) (hash(x)=25856625) +952 train 7.204317 (lr=1.7151e-04) (hash(x)=25219129) +953 train 7.168865 (lr=1.7150e-04) (hash(x)=25260471) +954 train 7.621967 (lr=1.7150e-04) (hash(x)=29373370) +955 train 7.094585 (lr=1.7149e-04) (hash(x)=23437426) +956 train 7.456252 (lr=1.7148e-04) (hash(x)=23769521) +957 train 7.521903 (lr=1.7147e-04) (hash(x)=25961833) +958 train 7.226558 (lr=1.7147e-04) (hash(x)=23582666) +959 train 7.311450 (lr=1.7146e-04) (hash(x)=23164356) +960 train 7.254163 (lr=1.7145e-04) (hash(x)=24443114) +961 train 7.332226 (lr=1.7144e-04) (hash(x)=25052665) +962 train 7.458611 (lr=1.7144e-04) (hash(x)=27802272) +963 train 7.270822 (lr=1.7143e-04) (hash(x)=25957896) +964 train 7.347778 (lr=1.7142e-04) (hash(x)=26737251) +965 train 7.501845 (lr=1.7142e-04) (hash(x)=24723263) +966 train 7.420486 (lr=1.7141e-04) (hash(x)=24707011) +967 train 7.428133 (lr=1.7140e-04) (hash(x)=25646282) +968 train 7.454709 (lr=1.7139e-04) (hash(x)=27544665) +969 train 7.339728 (lr=1.7139e-04) (hash(x)=25851993) +970 train 7.724787 (lr=1.7138e-04) (hash(x)=29059700) +971 train 7.429220 (lr=1.7137e-04) (hash(x)=21513584) +972 train 7.213628 (lr=1.7136e-04) (hash(x)=23151267) +973 train 7.433173 (lr=1.7136e-04) (hash(x)=26017176) +974 train 7.465435 (lr=1.7135e-04) (hash(x)=26979518) +975 train 7.453277 (lr=1.7134e-04) (hash(x)=23843233) +976 train 7.675657 (lr=1.7133e-04) (hash(x)=24193010) +977 train 7.358127 (lr=1.7133e-04) (hash(x)=21476847) +978 train 7.213284 (lr=1.7132e-04) (hash(x)=21366504) +979 train 7.193771 (lr=1.7131e-04) (hash(x)=23226697) +980 train 6.979225 (lr=1.7130e-04) (hash(x)=19961773) +981 train 6.867967 (lr=1.7130e-04) (hash(x)=19772969) +982 train 7.203844 (lr=1.7129e-04) (hash(x)=23110142) +983 train 7.454412 (lr=1.7128e-04) (hash(x)=24506028) +984 train 7.453249 (lr=1.7127e-04) (hash(x)=25480731) +985 train 7.263885 (lr=1.7127e-04) (hash(x)=21077417) +986 train 7.257013 (lr=1.7126e-04) (hash(x)=23686713) +987 train 7.292868 (lr=1.7125e-04) (hash(x)=26024321) +988 train 7.408092 (lr=1.7124e-04) (hash(x)=27424109) +989 train 7.542737 (lr=1.7124e-04) (hash(x)=27786174) +990 train 7.349844 (lr=1.7123e-04) (hash(x)=25232502) +991 train 7.347635 (lr=1.7122e-04) (hash(x)=22781277) +992 train 7.459560 (lr=1.7121e-04) (hash(x)=26184527) +993 train 7.418424 (lr=1.7121e-04) (hash(x)=24459895) +994 train 7.392319 (lr=1.7120e-04) (hash(x)=25244624) +995 train 7.514288 (lr=1.7119e-04) (hash(x)=24451843) +996 train 7.532412 (lr=1.7118e-04) (hash(x)=22129897) +997 train 7.256130 (lr=1.7118e-04) (hash(x)=21116390) +998 train 7.073079 (lr=1.7117e-04) (hash(x)=20650070) +999 train 7.462614 (lr=1.7116e-04) (hash(x)=24948650) +1000 val loss 7.3487 +1000 val perplexity 1554.1979 +1000 train 7.364742 (lr=1.7115e-04) (hash(x)=25444553) +1001 train 7.321649 (lr=1.7114e-04) (hash(x)=25617781) +1002 train 7.212125 (lr=1.7114e-04) (hash(x)=23862434) +1003 train 7.266995 (lr=1.7113e-04) (hash(x)=25559534) +1004 train 7.472035 (lr=1.7112e-04) (hash(x)=26577585) +1005 train 7.334969 (lr=1.7111e-04) (hash(x)=25546274) +1006 train 7.359958 (lr=1.7111e-04) (hash(x)=26284202) +1007 train 7.418993 (lr=1.7110e-04) (hash(x)=26373991) +1008 train 7.319303 (lr=1.7109e-04) (hash(x)=24612851) +1009 train 7.422052 (lr=1.7108e-04) (hash(x)=26410662) +1010 train 7.474313 (lr=1.7108e-04) (hash(x)=23824841) +1011 train 7.744843 (lr=1.7107e-04) (hash(x)=27756673) +1012 train 7.469768 (lr=1.7106e-04) (hash(x)=25427447) +1013 train 7.484413 (lr=1.7105e-04) (hash(x)=23661686) +1014 train 7.367393 (lr=1.7104e-04) (hash(x)=25129504) +1015 train 7.301383 (lr=1.7104e-04) (hash(x)=23402396) +1016 train 7.573224 (lr=1.7103e-04) (hash(x)=26145557) +1017 train 7.303380 (lr=1.7102e-04) (hash(x)=26547918) +1018 train 7.416523 (lr=1.7101e-04) (hash(x)=26653070) +1019 train 7.432761 (lr=1.7101e-04) (hash(x)=28250354) +1020 train 7.398674 (lr=1.7100e-04) (hash(x)=25437401) +1021 train 7.457897 (lr=1.7099e-04) (hash(x)=25598861) +1022 train 7.286643 (lr=1.7098e-04) (hash(x)=24572587) +1023 train 7.312264 (lr=1.7097e-04) (hash(x)=21562133) +1024 train 7.724053 (lr=1.7097e-04) (hash(x)=27718876) +1025 train 7.306474 (lr=1.7096e-04) (hash(x)=25312391) +1026 train 7.381176 (lr=1.7095e-04) (hash(x)=26579535) +1027 train 7.639217 (lr=1.7094e-04) (hash(x)=27253861) +1028 train 7.518033 (lr=1.7094e-04) (hash(x)=28451867) +1029 train 7.206136 (lr=1.7093e-04) (hash(x)=26795921) +1030 train 7.356931 (lr=1.7092e-04) (hash(x)=26147208) +1031 train 7.432410 (lr=1.7091e-04) (hash(x)=25009210) +1032 train 7.354872 (lr=1.7090e-04) (hash(x)=25213771) +1033 train 7.258798 (lr=1.7090e-04) (hash(x)=26254538) +1034 train 7.307682 (lr=1.7089e-04) (hash(x)=25565614) +1035 train 7.155371 (lr=1.7088e-04) (hash(x)=23052577) +1036 train 7.987491 (lr=1.7087e-04) (hash(x)=29630613) +1037 train 7.208566 (lr=1.7086e-04) (hash(x)=23667224) +1038 train 7.328963 (lr=1.7086e-04) (hash(x)=25740670) +1039 train 7.467515 (lr=1.7085e-04) (hash(x)=27161811) +1040 train 7.582025 (lr=1.7084e-04) (hash(x)=26385663) +1041 train 7.287973 (lr=1.7083e-04) (hash(x)=26313522) +1042 train 7.370128 (lr=1.7083e-04) (hash(x)=26814686) +1043 train 7.496887 (lr=1.7082e-04) (hash(x)=27302459) +1044 train 7.783177 (lr=1.7081e-04) (hash(x)=26758132) +1045 train 7.367226 (lr=1.7080e-04) (hash(x)=26837963) +1046 train 7.203972 (lr=1.7079e-04) (hash(x)=22089547) +1047 train 7.726242 (lr=1.7079e-04) (hash(x)=29515100) +1048 train 7.438416 (lr=1.7078e-04) (hash(x)=25471442) +1049 train 7.345440 (lr=1.7077e-04) (hash(x)=26674478) +1050 val loss 7.3550 +1050 val perplexity 1563.9963 +1050 train 7.322531 (lr=1.7076e-04) (hash(x)=25373386) +1051 train 7.324645 (lr=1.7075e-04) (hash(x)=25318001) +1052 train 7.520314 (lr=1.7075e-04) (hash(x)=27255021) +1053 train 7.453936 (lr=1.7074e-04) (hash(x)=25174043) +1054 train 7.199980 (lr=1.7073e-04) (hash(x)=23857597) +1055 train 7.434664 (lr=1.7072e-04) (hash(x)=25305929) +1056 train 7.458626 (lr=1.7071e-04) (hash(x)=27009246) +1057 train 7.530457 (lr=1.7071e-04) (hash(x)=26175477) +1058 train 7.158226 (lr=1.7070e-04) (hash(x)=22700025) +1059 train 7.305308 (lr=1.7069e-04) (hash(x)=24339043) +1060 train 7.168544 (lr=1.7068e-04) (hash(x)=22139900) +1061 train 7.937405 (lr=1.7067e-04) (hash(x)=25412772) +1062 train 7.389800 (lr=1.7066e-04) (hash(x)=27020849) +1063 train 7.317282 (lr=1.7066e-04) (hash(x)=26808543) +1064 train 7.118846 (lr=1.7065e-04) (hash(x)=23061527) +1065 train 7.341051 (lr=1.7064e-04) (hash(x)=24738650) +1066 train 7.142502 (lr=1.7063e-04) (hash(x)=24036715) +1067 train 7.206356 (lr=1.7062e-04) (hash(x)=25763991) +1068 train 7.502979 (lr=1.7062e-04) (hash(x)=27393753) +1069 train 7.607764 (lr=1.7061e-04) (hash(x)=28182190) +1070 train 7.227566 (lr=1.7060e-04) (hash(x)=23358569) +1071 train 7.421059 (lr=1.7059e-04) (hash(x)=25669509) +1072 train 7.512629 (lr=1.7058e-04) (hash(x)=29139024) +1073 train 7.447246 (lr=1.7058e-04) (hash(x)=25616522) +1074 train 7.320650 (lr=1.7057e-04) (hash(x)=25695789) +1075 train 7.527893 (lr=1.7056e-04) (hash(x)=27676869) +1076 train 7.398305 (lr=1.7055e-04) (hash(x)=25952695) +1077 train 7.379205 (lr=1.7054e-04) (hash(x)=26316170) +1078 train 7.288249 (lr=1.7053e-04) (hash(x)=24081867) +1079 train 7.454759 (lr=1.7053e-04) (hash(x)=28435805) +1080 train 7.369466 (lr=1.7052e-04) (hash(x)=23375063) +1081 train 7.344190 (lr=1.7051e-04) (hash(x)=26869022) +1082 train 7.217685 (lr=1.7050e-04) (hash(x)=25793007) +1083 train 7.160675 (lr=1.7049e-04) (hash(x)=23455211) +1084 train 7.235754 (lr=1.7048e-04) (hash(x)=20441501) +1085 train 7.659101 (lr=1.7048e-04) (hash(x)=29321187) +1086 train 7.844403 (lr=1.7047e-04) (hash(x)=32627505) +1087 train 7.270303 (lr=1.7046e-04) (hash(x)=26482758) +1088 train 7.086067 (lr=1.7045e-04) (hash(x)=21431511) +1089 train 7.310867 (lr=1.7044e-04) (hash(x)=26046639) +1090 train 7.433331 (lr=1.7044e-04) (hash(x)=27464841) +1091 train 7.290209 (lr=1.7043e-04) (hash(x)=27068280) +1092 train 7.189130 (lr=1.7042e-04) (hash(x)=23119133) +1093 train 7.366785 (lr=1.7041e-04) (hash(x)=26782091) +1094 train 7.420967 (lr=1.7040e-04) (hash(x)=26265326) +1095 train 7.398642 (lr=1.7039e-04) (hash(x)=24929929) +1096 train 7.275880 (lr=1.7039e-04) (hash(x)=23158628) +1097 train 7.373760 (lr=1.7038e-04) (hash(x)=25950541) +1098 train 7.148512 (lr=1.7037e-04) (hash(x)=22093912) +1099 train 7.282513 (lr=1.7036e-04) (hash(x)=25373676) +1100 val loss 7.3035 +1100 val perplexity 1485.4797 +1100 train 7.012780 (lr=1.7035e-04) (hash(x)=18986670) +1101 train 7.556435 (lr=1.7034e-04) (hash(x)=27283187) +1102 train 7.298884 (lr=1.7034e-04) (hash(x)=25474743) +1103 train 7.183403 (lr=1.7033e-04) (hash(x)=25043037) +1104 train 7.099920 (lr=1.7032e-04) (hash(x)=23156261) +1105 train 7.600711 (lr=1.7031e-04) (hash(x)=27027534) +1106 train 7.169823 (lr=1.7030e-04) (hash(x)=22733630) +1107 train 7.432134 (lr=1.7029e-04) (hash(x)=27906976) +1108 train 7.418533 (lr=1.7028e-04) (hash(x)=27848655) +1109 train 7.340860 (lr=1.7028e-04) (hash(x)=23889709) +1110 train 8.330238 (lr=1.7027e-04) (hash(x)=33189918) +1111 train 7.948875 (lr=1.7026e-04) (hash(x)=29151257) +1112 train 7.647668 (lr=1.7025e-04) (hash(x)=23881512) +1113 train 7.362649 (lr=1.7024e-04) (hash(x)=21307974) +1114 train 7.346222 (lr=1.7023e-04) (hash(x)=25264524) +1115 train 7.474779 (lr=1.7023e-04) (hash(x)=26405613) +1116 train 7.126159 (lr=1.7022e-04) (hash(x)=21918678) +1117 train 7.141615 (lr=1.7021e-04) (hash(x)=24233887) +1118 train 6.791396 (lr=1.7020e-04) (hash(x)=19490509) +1119 train 7.479090 (lr=1.7019e-04) (hash(x)=26400365) +1120 train 7.761586 (lr=1.7018e-04) (hash(x)=28572086) +1121 train 7.150074 (lr=1.7017e-04) (hash(x)=22293114) +1122 train 7.289867 (lr=1.7017e-04) (hash(x)=26845479) +1123 train 7.176906 (lr=1.7016e-04) (hash(x)=23971905) +1124 train 7.395374 (lr=1.7015e-04) (hash(x)=25639959) +1125 train 7.020345 (lr=1.7014e-04) (hash(x)=20076502) +1126 train 7.413547 (lr=1.7013e-04) (hash(x)=25089255) +1127 train 7.269116 (lr=1.7012e-04) (hash(x)=24098812) +1128 train 7.288963 (lr=1.7011e-04) (hash(x)=23493707) +1129 train 7.532476 (lr=1.7011e-04) (hash(x)=27610410) +1130 train 7.256096 (lr=1.7010e-04) (hash(x)=24540186) +1131 train 7.566958 (lr=1.7009e-04) (hash(x)=29402976) +1132 train 7.137786 (lr=1.7008e-04) (hash(x)=23776025) +1133 train 6.887546 (lr=1.7007e-04) (hash(x)=19032564) +1134 train 7.484811 (lr=1.7006e-04) (hash(x)=26921117) +1135 train 7.070796 (lr=1.7005e-04) (hash(x)=20967666) +1136 train 7.131073 (lr=1.7005e-04) (hash(x)=23394540) +1137 train 7.192506 (lr=1.7004e-04) (hash(x)=22666342) +1138 train 7.398232 (lr=1.7003e-04) (hash(x)=23482498) +1139 train 7.428648 (lr=1.7002e-04) (hash(x)=24287610) +1140 train 7.479375 (lr=1.7001e-04) (hash(x)=24512831) +1141 train 7.724477 (lr=1.7000e-04) (hash(x)=28637634) +1142 train 7.916282 (lr=1.6999e-04) (hash(x)=24107127) +1143 train 7.587456 (lr=1.6998e-04) (hash(x)=28667963) +1144 train 7.468751 (lr=1.6998e-04) (hash(x)=26302492) +1145 train 7.466949 (lr=1.6997e-04) (hash(x)=23621685) +1146 train 7.191504 (lr=1.6996e-04) (hash(x)=23997414) +1147 train 7.284860 (lr=1.6995e-04) (hash(x)=25974316) +1148 train 7.233768 (lr=1.6994e-04) (hash(x)=23464988) +1149 train 7.366230 (lr=1.6993e-04) (hash(x)=24487710) +1150 val loss 7.3554 +1150 val perplexity 1564.6877 +1150 train 7.624738 (lr=1.6992e-04) (hash(x)=29610350) +1151 train 7.759580 (lr=1.6992e-04) (hash(x)=27083417) +1152 train 7.007880 (lr=1.6991e-04) (hash(x)=20666288) +1153 train 7.112840 (lr=1.6990e-04) (hash(x)=22850633) +1154 train 7.310382 (lr=1.6989e-04) (hash(x)=24741872) +1155 train 7.736496 (lr=1.6988e-04) (hash(x)=28605205) +1156 train 7.130516 (lr=1.6987e-04) (hash(x)=22624463) +1157 train 7.366961 (lr=1.6986e-04) (hash(x)=24786468) +1158 train 7.051040 (lr=1.6985e-04) (hash(x)=21365399) +1159 train 7.306826 (lr=1.6985e-04) (hash(x)=23649001) +1160 train 7.406339 (lr=1.6984e-04) (hash(x)=28203982) +1161 train 7.299213 (lr=1.6983e-04) (hash(x)=26473994) +1162 train 7.000452 (lr=1.6982e-04) (hash(x)=19476441) +1163 train 7.295290 (lr=1.6981e-04) (hash(x)=25921700) +1164 train 7.141401 (lr=1.6980e-04) (hash(x)=23064343) +1165 train 7.318882 (lr=1.6979e-04) (hash(x)=24117626) +1166 train 7.249561 (lr=1.6978e-04) (hash(x)=21764556) +1167 train 8.116375 (lr=1.6977e-04) (hash(x)=31338300) +1168 train 7.546416 (lr=1.6977e-04) (hash(x)=27443187) +1169 train 6.908689 (lr=1.6976e-04) (hash(x)=21337692) +1170 train 7.439312 (lr=1.6975e-04) (hash(x)=27845383) +1171 train 7.246575 (lr=1.6974e-04) (hash(x)=23862328) +1172 train 7.477600 (lr=1.6973e-04) (hash(x)=23811014) +1173 train 7.405194 (lr=1.6972e-04) (hash(x)=24380098) +1174 train 7.051769 (lr=1.6971e-04) (hash(x)=22351136) +1175 train 7.434986 (lr=1.6970e-04) (hash(x)=30603174) +1176 train 7.461113 (lr=1.6969e-04) (hash(x)=27924596) +1177 train 7.822130 (lr=1.6969e-04) (hash(x)=30882548) +1178 train 7.222208 (lr=1.6968e-04) (hash(x)=22339464) +1179 train 7.068852 (lr=1.6967e-04) (hash(x)=23603806) +1180 train 7.452847 (lr=1.6966e-04) (hash(x)=24809041) +1181 train 7.249598 (lr=1.6965e-04) (hash(x)=24382442) +1182 train 7.191129 (lr=1.6964e-04) (hash(x)=23134077) +1183 train 7.225625 (lr=1.6963e-04) (hash(x)=24830965) +1184 train 7.310234 (lr=1.6962e-04) (hash(x)=25527259) +1185 train 7.369991 (lr=1.6961e-04) (hash(x)=25547480) +1186 train 7.182691 (lr=1.6960e-04) (hash(x)=24424314) +1187 train 7.648182 (lr=1.6960e-04) (hash(x)=32488729) +1188 train 7.583559 (lr=1.6959e-04) (hash(x)=31168462) +1189 train 7.815445 (lr=1.6958e-04) (hash(x)=31331643) +1190 train 7.443772 (lr=1.6957e-04) (hash(x)=28746633) +1191 train 7.415104 (lr=1.6956e-04) (hash(x)=27269893) +1192 train 7.186811 (lr=1.6955e-04) (hash(x)=23484031) +1193 train 7.200359 (lr=1.6954e-04) (hash(x)=23278725) +1194 train 7.338876 (lr=1.6953e-04) (hash(x)=25440745) +1195 train 7.379451 (lr=1.6952e-04) (hash(x)=25215077) +1196 train 7.442348 (lr=1.6951e-04) (hash(x)=28309266) +1197 train 7.139370 (lr=1.6951e-04) (hash(x)=22442404) +1198 train 7.149053 (lr=1.6950e-04) (hash(x)=20775262) +1199 train 7.229539 (lr=1.6949e-04) (hash(x)=24825041) +1200 val loss 7.2893 +1200 val perplexity 1464.5388 +1200 train 7.427461 (lr=1.6948e-04) (hash(x)=29016896) +1201 train 7.349986 (lr=1.6947e-04) (hash(x)=25590276) +1202 train 7.183403 (lr=1.6946e-04) (hash(x)=22816384) +1203 train 7.382070 (lr=1.6945e-04) (hash(x)=25893804) +1204 train 7.241312 (lr=1.6944e-04) (hash(x)=23983816) +1205 train 7.116162 (lr=1.6943e-04) (hash(x)=22222468) +1206 train 7.198715 (lr=1.6942e-04) (hash(x)=23039141) +1207 train 7.123201 (lr=1.6941e-04) (hash(x)=22724871) +1208 train 7.215744 (lr=1.6940e-04) (hash(x)=25253062) +1209 train 7.207423 (lr=1.6940e-04) (hash(x)=25140744) +1210 train 7.288469 (lr=1.6939e-04) (hash(x)=24717218) +1211 train 7.390728 (lr=1.6938e-04) (hash(x)=27317554) +1212 train 7.014757 (lr=1.6937e-04) (hash(x)=22013236) +1213 train 7.578937 (lr=1.6936e-04) (hash(x)=26692343) +1214 train 7.084622 (lr=1.6935e-04) (hash(x)=19859225) +1215 train 7.022730 (lr=1.6934e-04) (hash(x)=24683717) +1216 train 7.113950 (lr=1.6933e-04) (hash(x)=21932013) +1217 train 7.374730 (lr=1.6932e-04) (hash(x)=26849303) +1218 train 7.477870 (lr=1.6931e-04) (hash(x)=26458000) +1219 train 7.207565 (lr=1.6930e-04) (hash(x)=21584083) +1220 train 7.601984 (lr=1.6929e-04) (hash(x)=23598625) +1221 train 7.295946 (lr=1.6929e-04) (hash(x)=26059939) +1222 train 7.543237 (lr=1.6928e-04) (hash(x)=25481982) +1223 train 7.411541 (lr=1.6927e-04) (hash(x)=26190337) +1224 train 7.565211 (lr=1.6926e-04) (hash(x)=28767755) +1225 train 7.221604 (lr=1.6925e-04) (hash(x)=23663918) +1226 train 7.363104 (lr=1.6924e-04) (hash(x)=21293227) +1227 train 7.344974 (lr=1.6923e-04) (hash(x)=22249019) +1228 train 7.440430 (lr=1.6922e-04) (hash(x)=26886529) +1229 train 7.251349 (lr=1.6921e-04) (hash(x)=25779849) +1230 train 7.394920 (lr=1.6920e-04) (hash(x)=26228964) +1231 train 7.317209 (lr=1.6919e-04) (hash(x)=23086289) +1232 train 7.430899 (lr=1.6918e-04) (hash(x)=23198922) +1233 train 7.452879 (lr=1.6917e-04) (hash(x)=27523941) +1234 train 7.193835 (lr=1.6916e-04) (hash(x)=24293992) +1235 train 7.930650 (lr=1.6915e-04) (hash(x)=28047044) +1236 train 7.390512 (lr=1.6915e-04) (hash(x)=23688671) +1237 train 7.260832 (lr=1.6914e-04) (hash(x)=25125498) +1238 train 7.138358 (lr=1.6913e-04) (hash(x)=21977292) +1239 train 7.312904 (lr=1.6912e-04) (hash(x)=23593875) +1240 train 7.136464 (lr=1.6911e-04) (hash(x)=22659030) +1241 train 7.255498 (lr=1.6910e-04) (hash(x)=25117733) +1242 train 7.223252 (lr=1.6909e-04) (hash(x)=22322808) +1243 train 7.310516 (lr=1.6908e-04) (hash(x)=26059735) +1244 train 7.285142 (lr=1.6907e-04) (hash(x)=22485526) +1245 train 7.178739 (lr=1.6906e-04) (hash(x)=23028679) +1246 train 7.192830 (lr=1.6905e-04) (hash(x)=22906035) +1247 train 7.110574 (lr=1.6904e-04) (hash(x)=22414190) +1248 train 7.381729 (lr=1.6903e-04) (hash(x)=26229624) +1249 train 7.130967 (lr=1.6902e-04) (hash(x)=22223137) +1250 val loss 7.2923 +1250 val perplexity 1469.0004 +1250 train 7.452713 (lr=1.6901e-04) (hash(x)=24911520) +1251 train 7.663809 (lr=1.6900e-04) (hash(x)=24204591) +1252 train 7.135028 (lr=1.6899e-04) (hash(x)=24379601) +1253 train 7.129131 (lr=1.6899e-04) (hash(x)=22922475) +1254 train 7.217510 (lr=1.6898e-04) (hash(x)=23426249) +1255 train 7.412304 (lr=1.6897e-04) (hash(x)=26758114) +1256 train 7.109962 (lr=1.6896e-04) (hash(x)=24027111) +1257 train 7.271157 (lr=1.6895e-04) (hash(x)=25358064) +1258 train 7.151071 (lr=1.6894e-04) (hash(x)=22571285) +1259 train 7.540486 (lr=1.6893e-04) (hash(x)=20084233) +1260 train 7.394174 (lr=1.6892e-04) (hash(x)=18786581) +1261 train 7.288876 (lr=1.6891e-04) (hash(x)=26395104) +1262 train 7.204344 (lr=1.6890e-04) (hash(x)=24212567) +1263 train 7.004578 (lr=1.6889e-04) (hash(x)=21563184) +1264 train 7.300999 (lr=1.6888e-04) (hash(x)=26490150) +1265 train 7.396229 (lr=1.6887e-04) (hash(x)=25207694) +1266 train 7.244557 (lr=1.6886e-04) (hash(x)=23914544) +1267 train 7.154321 (lr=1.6885e-04) (hash(x)=23861489) +1268 train 7.697505 (lr=1.6884e-04) (hash(x)=30714540) +1269 train 7.166350 (lr=1.6883e-04) (hash(x)=23471007) +1270 train 7.179688 (lr=1.6882e-04) (hash(x)=23244293) +1271 train 7.096256 (lr=1.6881e-04) (hash(x)=19218470) +1272 train 7.432140 (lr=1.6880e-04) (hash(x)=26965136) +1273 train 7.136637 (lr=1.6879e-04) (hash(x)=22944035) +1274 train 7.184428 (lr=1.6878e-04) (hash(x)=22002714) +1275 train 7.517316 (lr=1.6877e-04) (hash(x)=28469562) +1276 train 7.568788 (lr=1.6877e-04) (hash(x)=26889992) +1277 train 7.708136 (lr=1.6876e-04) (hash(x)=26452814) +1278 train 7.403123 (lr=1.6875e-04) (hash(x)=28397488) +1279 train 7.552557 (lr=1.6874e-04) (hash(x)=25588469) +1280 train 7.403415 (lr=1.6873e-04) (hash(x)=24833139) +1281 train 7.288645 (lr=1.6872e-04) (hash(x)=24788298) +1282 train 7.573669 (lr=1.6871e-04) (hash(x)=24979383) +1283 train 7.608803 (lr=1.6870e-04) (hash(x)=25236367) +1284 train 7.496301 (lr=1.6869e-04) (hash(x)=22638257) +1285 train 7.402524 (lr=1.6868e-04) (hash(x)=23069067) +1286 train 7.504482 (lr=1.6867e-04) (hash(x)=25133239) +1287 train 8.073915 (lr=1.6866e-04) (hash(x)=30433767) +1288 train 8.073992 (lr=1.6865e-04) (hash(x)=34319079) +1289 train 7.888945 (lr=1.6864e-04) (hash(x)=29268881) +1290 train 7.528261 (lr=1.6863e-04) (hash(x)=24528336) +1291 train 7.670931 (lr=1.6862e-04) (hash(x)=26302626) +1292 train 7.596714 (lr=1.6861e-04) (hash(x)=25479111) +1293 train 7.804012 (lr=1.6860e-04) (hash(x)=24749682) +1294 train 7.449883 (lr=1.6859e-04) (hash(x)=24111393) +1295 train 7.056259 (lr=1.6858e-04) (hash(x)=17851621) +1296 train 7.324935 (lr=1.6857e-04) (hash(x)=26463070) +1297 train 7.396608 (lr=1.6856e-04) (hash(x)=25620741) +1298 train 8.079783 (lr=1.6855e-04) (hash(x)=28225676) +1299 train 7.884273 (lr=1.6854e-04) (hash(x)=27028191) +1300 val loss 7.3810 +1300 val perplexity 1605.1750 +1300 train 7.468037 (lr=1.6853e-04) (hash(x)=29006516) +1301 train 7.574924 (lr=1.6852e-04) (hash(x)=27590299) +1302 train 7.716960 (lr=1.6851e-04) (hash(x)=28678983) +1303 train 7.538952 (lr=1.6850e-04) (hash(x)=25183690) +1304 train 7.117168 (lr=1.6849e-04) (hash(x)=19918097) +1305 train 7.936279 (lr=1.6848e-04) (hash(x)=31114252) +1306 train 7.971478 (lr=1.6847e-04) (hash(x)=30913255) +1307 train 7.453697 (lr=1.6846e-04) (hash(x)=26182243) +1308 train 7.693331 (lr=1.6845e-04) (hash(x)=27420668) +1309 train 7.882478 (lr=1.6844e-04) (hash(x)=30419908) +1310 train 7.806268 (lr=1.6843e-04) (hash(x)=29002281) +1311 train 7.535689 (lr=1.6842e-04) (hash(x)=27040642) +1312 train 7.439781 (lr=1.6841e-04) (hash(x)=26929300) +1313 train 7.542525 (lr=1.6840e-04) (hash(x)=26240761) +1314 train 7.618105 (lr=1.6839e-04) (hash(x)=27161876) +1315 train 7.385916 (lr=1.6838e-04) (hash(x)=24489607) +1316 train 7.735037 (lr=1.6837e-04) (hash(x)=27040115) +1317 train 7.407663 (lr=1.6836e-04) (hash(x)=25012872) +1318 train 7.035732 (lr=1.6835e-04) (hash(x)=20894720) +1319 train 7.154698 (lr=1.6834e-04) (hash(x)=22183303) +1320 train 7.411315 (lr=1.6833e-04) (hash(x)=26291778) +1321 train 7.562580 (lr=1.6832e-04) (hash(x)=27682633) +1322 train 7.252292 (lr=1.6831e-04) (hash(x)=26490892) +1323 train 7.747901 (lr=1.6830e-04) (hash(x)=28844646) +1324 train 8.085184 (lr=1.6829e-04) (hash(x)=29545304) +1325 train 8.210191 (lr=1.6828e-04) (hash(x)=31082070) +1326 train 7.834241 (lr=1.6827e-04) (hash(x)=27486316) +1327 train 7.709617 (lr=1.6826e-04) (hash(x)=27537063) +1328 train 7.513256 (lr=1.6825e-04) (hash(x)=26955557) +1329 train 7.511653 (lr=1.6824e-04) (hash(x)=26125988) +1330 train 7.499639 (lr=1.6823e-04) (hash(x)=22800125) +1331 train 7.643684 (lr=1.6822e-04) (hash(x)=25446686) +1332 train 7.695862 (lr=1.6821e-04) (hash(x)=28743746) +1333 train 7.390575 (lr=1.6820e-04) (hash(x)=19819857) +1334 train 7.150829 (lr=1.6819e-04) (hash(x)=23518628) +1335 train 7.073029 (lr=1.6818e-04) (hash(x)=19492832) +1336 train 7.390504 (lr=1.6817e-04) (hash(x)=24627720) +1337 train 7.267519 (lr=1.6816e-04) (hash(x)=23741214) +1338 train 7.339093 (lr=1.6815e-04) (hash(x)=25837914) +1339 train 7.239967 (lr=1.6814e-04) (hash(x)=25484958) +1340 train 7.213388 (lr=1.6813e-04) (hash(x)=23671284) +1341 train 7.280254 (lr=1.6812e-04) (hash(x)=25525370) +1342 train 7.438568 (lr=1.6811e-04) (hash(x)=26585300) +1343 train 7.470137 (lr=1.6810e-04) (hash(x)=25951629) +1344 train 7.695392 (lr=1.6809e-04) (hash(x)=28743135) +1345 train 7.904527 (lr=1.6808e-04) (hash(x)=28557663) +1346 train 7.257165 (lr=1.6807e-04) (hash(x)=22642751) +1347 train 7.164679 (lr=1.6806e-04) (hash(x)=23462798) +1348 train 7.086674 (lr=1.6805e-04) (hash(x)=24292328) +1349 train 7.389279 (lr=1.6804e-04) (hash(x)=27320280) +1350 val loss 7.3376 +1350 val perplexity 1537.0669 +1350 train 7.561740 (lr=1.6803e-04) (hash(x)=27352812) +1351 train 7.388153 (lr=1.6802e-04) (hash(x)=22408682) +1352 train 7.292865 (lr=1.6801e-04) (hash(x)=23144732) +1353 train 7.136622 (lr=1.6800e-04) (hash(x)=22230799) +1354 train 7.644997 (lr=1.6799e-04) (hash(x)=29747687) +1355 train 7.833942 (lr=1.6798e-04) (hash(x)=31317970) +1356 train 6.914219 (lr=1.6797e-04) (hash(x)=20131758) +1357 train 7.371128 (lr=1.6796e-04) (hash(x)=24020983) +1358 train 7.188481 (lr=1.6795e-04) (hash(x)=23998051) +1359 train 7.311749 (lr=1.6794e-04) (hash(x)=27633457) +1360 train 7.000914 (lr=1.6793e-04) (hash(x)=20155247) +1361 train 7.303020 (lr=1.6792e-04) (hash(x)=23766987) +1362 train 7.197865 (lr=1.6791e-04) (hash(x)=25960383) +1363 train 7.476614 (lr=1.6790e-04) (hash(x)=23729283) +1364 train 7.622457 (lr=1.6789e-04) (hash(x)=27775445) +1365 train 7.471893 (lr=1.6788e-04) (hash(x)=25975834) +1366 train 7.301226 (lr=1.6787e-04) (hash(x)=22765259) +1367 train 7.568687 (lr=1.6786e-04) (hash(x)=27635080) +1368 train 7.300228 (lr=1.6785e-04) (hash(x)=23848542) +1369 train 7.446013 (lr=1.6784e-04) (hash(x)=27181156) +1370 train 7.624511 (lr=1.6783e-04) (hash(x)=28321340) +1371 train 7.359806 (lr=1.6782e-04) (hash(x)=25918780) +1372 train 7.353857 (lr=1.6781e-04) (hash(x)=23338297) +1373 train 7.426582 (lr=1.6780e-04) (hash(x)=22370417) +1374 train 7.416944 (lr=1.6779e-04) (hash(x)=24272668) +1375 train 7.081144 (lr=1.6778e-04) (hash(x)=22287596) +1376 train 7.282355 (lr=1.6776e-04) (hash(x)=25257403) +1377 train 7.196697 (lr=1.6775e-04) (hash(x)=21584419) +1378 train 7.411576 (lr=1.6774e-04) (hash(x)=25318823) +1379 train 7.152982 (lr=1.6773e-04) (hash(x)=22694623) +1380 train 7.290915 (lr=1.6772e-04) (hash(x)=23743406) +1381 train 7.586244 (lr=1.6771e-04) (hash(x)=30820846) +1382 train 8.132363 (lr=1.6770e-04) (hash(x)=34639557) +1383 train 7.995103 (lr=1.6769e-04) (hash(x)=35895440) +1384 train 7.363719 (lr=1.6768e-04) (hash(x)=26304839) +1385 train 7.522652 (lr=1.6767e-04) (hash(x)=27058657) +1386 train 7.419740 (lr=1.6766e-04) (hash(x)=25209529) +1387 train 7.293233 (lr=1.6765e-04) (hash(x)=24298886) +1388 train 7.422395 (lr=1.6764e-04) (hash(x)=26200200) +1389 train 7.344403 (lr=1.6763e-04) (hash(x)=27303061) +1390 train 7.385816 (lr=1.6762e-04) (hash(x)=26531628) +1391 train 7.407486 (lr=1.6761e-04) (hash(x)=25888847) +1392 train 7.606818 (lr=1.6760e-04) (hash(x)=28924067) +1393 train 7.046886 (lr=1.6759e-04) (hash(x)=21267641) +1394 train 7.636278 (lr=1.6758e-04) (hash(x)=29419156) +1395 train 7.834409 (lr=1.6757e-04) (hash(x)=30860646) +1396 train 7.405828 (lr=1.6756e-04) (hash(x)=25744434) +1397 train 7.355171 (lr=1.6755e-04) (hash(x)=26881837) +1398 train 7.353644 (lr=1.6754e-04) (hash(x)=26676176) +1399 train 7.530951 (lr=1.6752e-04) (hash(x)=26518800) +1400 val loss 7.3262 +1400 val perplexity 1519.5825 +1400 train 7.250644 (lr=1.6751e-04) (hash(x)=25043238) +1401 train 7.510713 (lr=1.6750e-04) (hash(x)=25863277) +1402 train 7.185211 (lr=1.6749e-04) (hash(x)=24073623) +1403 train 7.226394 (lr=1.6748e-04) (hash(x)=25385523) +1404 train 7.294005 (lr=1.6747e-04) (hash(x)=24958112) +1405 train 7.200107 (lr=1.6746e-04) (hash(x)=23362519) +1406 train 7.524701 (lr=1.6745e-04) (hash(x)=29262616) +1407 train 7.938034 (lr=1.6744e-04) (hash(x)=37519283) +1408 train 8.238019 (lr=1.6743e-04) (hash(x)=33716930) +1409 train 7.332501 (lr=1.6742e-04) (hash(x)=23392584) +1410 train 7.816240 (lr=1.6741e-04) (hash(x)=22877779) +1411 train 8.183646 (lr=1.6740e-04) (hash(x)=20564397) +1412 train 7.578860 (lr=1.6739e-04) (hash(x)=24366235) +1413 train 7.427068 (lr=1.6738e-04) (hash(x)=27065499) +1414 train 7.276659 (lr=1.6737e-04) (hash(x)=26844114) +1415 train 7.399042 (lr=1.6736e-04) (hash(x)=25141945) +1416 train 7.629028 (lr=1.6734e-04) (hash(x)=28813116) +1417 train 7.399436 (lr=1.6733e-04) (hash(x)=25466598) +1418 train 7.254410 (lr=1.6732e-04) (hash(x)=22800032) +1419 train 7.344827 (lr=1.6731e-04) (hash(x)=22717866) +1420 train 7.922821 (lr=1.6730e-04) (hash(x)=28040763) +1421 train 8.033353 (lr=1.6729e-04) (hash(x)=29648992) +1422 train 7.977982 (lr=1.6728e-04) (hash(x)=31747228) +1423 train 7.356761 (lr=1.6727e-04) (hash(x)=28527939) +1424 train 7.262528 (lr=1.6726e-04) (hash(x)=21563992) +1425 train 7.228487 (lr=1.6725e-04) (hash(x)=25134784) +1426 train 7.453311 (lr=1.6724e-04) (hash(x)=28442823) +1427 train 8.015386 (lr=1.6723e-04) (hash(x)=32757059) +1428 train 7.137088 (lr=1.6722e-04) (hash(x)=24110500) +1429 train 7.218315 (lr=1.6721e-04) (hash(x)=24145729) +1430 train 7.293502 (lr=1.6720e-04) (hash(x)=23541086) +1431 train 7.159267 (lr=1.6718e-04) (hash(x)=21942471) +1432 train 7.252153 (lr=1.6717e-04) (hash(x)=24736836) +1433 train 7.423162 (lr=1.6716e-04) (hash(x)=25325444) +1434 train 7.404439 (lr=1.6715e-04) (hash(x)=25188954) +1435 train 7.980555 (lr=1.6714e-04) (hash(x)=24247339) +1436 train 7.388417 (lr=1.6713e-04) (hash(x)=23773363) +1437 train 7.132315 (lr=1.6712e-04) (hash(x)=24142989) +1438 train 7.153043 (lr=1.6711e-04) (hash(x)=24226952) +1439 train 7.381023 (lr=1.6710e-04) (hash(x)=24955630) +1440 train 7.307853 (lr=1.6709e-04) (hash(x)=24563233) +1441 train 7.430257 (lr=1.6708e-04) (hash(x)=25491335) +1442 train 7.815412 (lr=1.6707e-04) (hash(x)=33253763) +1443 train 7.176763 (lr=1.6705e-04) (hash(x)=21368780) +1444 train 7.224172 (lr=1.6704e-04) (hash(x)=26615500) +1445 train 7.462463 (lr=1.6703e-04) (hash(x)=27146278) +1446 train 7.324889 (lr=1.6702e-04) (hash(x)=25904861) +1447 train 7.133123 (lr=1.6701e-04) (hash(x)=25541230) +1448 train 7.337459 (lr=1.6700e-04) (hash(x)=25434227) +1449 train 7.265499 (lr=1.6699e-04) (hash(x)=25375355) +1450 val loss 7.2831 +1450 val perplexity 1455.5155 +1450 train 7.100755 (lr=1.6698e-04) (hash(x)=21921129) +1451 train 7.133897 (lr=1.6697e-04) (hash(x)=23098806) +1452 train 7.114453 (lr=1.6696e-04) (hash(x)=22000544) +1453 train 7.054414 (lr=1.6695e-04) (hash(x)=22061174) +1454 train 7.133292 (lr=1.6694e-04) (hash(x)=24326286) +1455 train 7.163066 (lr=1.6692e-04) (hash(x)=23501481) +1456 train 7.348842 (lr=1.6691e-04) (hash(x)=26397938) +1457 train 7.367274 (lr=1.6690e-04) (hash(x)=24656430) +1458 train 7.047231 (lr=1.6689e-04) (hash(x)=23494971) +1459 train 7.105865 (lr=1.6688e-04) (hash(x)=23802681) +1460 train 7.089640 (lr=1.6687e-04) (hash(x)=21990153) +1461 train 7.171082 (lr=1.6686e-04) (hash(x)=23496118) +1462 train 7.197286 (lr=1.6685e-04) (hash(x)=24233822) +1463 train 7.582451 (lr=1.6684e-04) (hash(x)=22754988) +1464 train 7.225813 (lr=1.6683e-04) (hash(x)=23116635) +1465 train 6.996608 (lr=1.6682e-04) (hash(x)=21461650) +1466 train 7.168151 (lr=1.6680e-04) (hash(x)=22274473) +1467 train 7.187218 (lr=1.6679e-04) (hash(x)=22183009) +1468 train 7.433422 (lr=1.6678e-04) (hash(x)=24972441) +1469 train 7.200826 (lr=1.6677e-04) (hash(x)=22300616) +1470 train 6.956067 (lr=1.6676e-04) (hash(x)=21443060) +1471 train 7.226720 (lr=1.6675e-04) (hash(x)=23475070) +1472 train 7.128043 (lr=1.6674e-04) (hash(x)=22316810) +1473 train 7.664482 (lr=1.6673e-04) (hash(x)=24508407) +1474 train 7.609012 (lr=1.6672e-04) (hash(x)=24603557) +1475 train 7.238603 (lr=1.6670e-04) (hash(x)=23359061) +1476 train 7.287071 (lr=1.6669e-04) (hash(x)=22950844) +1477 train 7.354896 (lr=1.6668e-04) (hash(x)=22588667) +1478 train 7.476388 (lr=1.6667e-04) (hash(x)=26083526) +1479 train 7.403482 (lr=1.6666e-04) (hash(x)=23609959) +1480 train 7.398591 (lr=1.6665e-04) (hash(x)=24088171) +1481 train 7.370496 (lr=1.6664e-04) (hash(x)=25394852) +1482 train 7.304263 (lr=1.6663e-04) (hash(x)=24503040) +1483 train 7.032187 (lr=1.6662e-04) (hash(x)=22408449) +1484 train 7.320941 (lr=1.6661e-04) (hash(x)=25069325) +1485 train 7.343579 (lr=1.6659e-04) (hash(x)=26947398) +1486 train 6.712953 (lr=1.6658e-04) (hash(x)=17527161) +1487 train 7.208717 (lr=1.6657e-04) (hash(x)=23441847) +1488 train 7.249193 (lr=1.6656e-04) (hash(x)=25592861) +1489 train 7.157814 (lr=1.6655e-04) (hash(x)=23101350) +1490 train 7.103365 (lr=1.6654e-04) (hash(x)=24201380) +1491 train 7.234295 (lr=1.6653e-04) (hash(x)=23676365) +1492 train 7.303934 (lr=1.6652e-04) (hash(x)=26668088) +1493 train 7.409822 (lr=1.6650e-04) (hash(x)=26488811) +1494 train 7.444499 (lr=1.6649e-04) (hash(x)=27248109) +1495 train 7.465642 (lr=1.6648e-04) (hash(x)=23096292) +1496 train 7.371344 (lr=1.6647e-04) (hash(x)=22101981) +1497 train 7.530304 (lr=1.6646e-04) (hash(x)=24512380) +1498 train 7.365834 (lr=1.6645e-04) (hash(x)=25367738) +1499 train 7.358765 (lr=1.6644e-04) (hash(x)=27706294) +1500 val loss 7.3029 +1500 val perplexity 1484.6384 +1500 train 7.437232 (lr=1.6643e-04) (hash(x)=24154026) +1501 train 7.128339 (lr=1.6642e-04) (hash(x)=21892472) +1502 train 7.224975 (lr=1.6640e-04) (hash(x)=23662543) +1503 train 7.299825 (lr=1.6639e-04) (hash(x)=26171093) +1504 train 7.344662 (lr=1.6638e-04) (hash(x)=25974292) +1505 train 7.159401 (lr=1.6637e-04) (hash(x)=23191101) +1506 train 7.393585 (lr=1.6636e-04) (hash(x)=26498861) +1507 train 7.929600 (lr=1.6635e-04) (hash(x)=34946941) +1508 train 7.560694 (lr=1.6634e-04) (hash(x)=25442719) +1509 train 7.397138 (lr=1.6632e-04) (hash(x)=25569942) +1510 train 7.117923 (lr=1.6631e-04) (hash(x)=21265828) +1511 train 7.017744 (lr=1.6630e-04) (hash(x)=20060838) +1512 train 7.212696 (lr=1.6629e-04) (hash(x)=22588251) +1513 train 7.179106 (lr=1.6628e-04) (hash(x)=24581020) +1514 train 7.118950 (lr=1.6627e-04) (hash(x)=21882493) +1515 train 7.067142 (lr=1.6626e-04) (hash(x)=21591702) +1516 train 7.081610 (lr=1.6625e-04) (hash(x)=19813285) +1517 train 7.188048 (lr=1.6623e-04) (hash(x)=21870012) +1518 train 7.243844 (lr=1.6622e-04) (hash(x)=26895498) +1519 train 7.271600 (lr=1.6621e-04) (hash(x)=25451055) +1520 train 7.331120 (lr=1.6620e-04) (hash(x)=25395865) +1521 train 6.761361 (lr=1.6619e-04) (hash(x)=18989695) +1522 train 6.661767 (lr=1.6618e-04) (hash(x)=17040678) +1523 train 6.757914 (lr=1.6617e-04) (hash(x)=18691455) +1524 train 6.855401 (lr=1.6615e-04) (hash(x)=19017167) +1525 train 7.188137 (lr=1.6614e-04) (hash(x)=22406503) +1526 train 7.338274 (lr=1.6613e-04) (hash(x)=23036138) +1527 train 7.224599 (lr=1.6612e-04) (hash(x)=24934792) +1528 train 7.251990 (lr=1.6611e-04) (hash(x)=22843127) +1529 train 7.188770 (lr=1.6610e-04) (hash(x)=24249677) +1530 train 7.060271 (lr=1.6609e-04) (hash(x)=23318555) +1531 train 7.095184 (lr=1.6607e-04) (hash(x)=23864361) +1532 train 6.978598 (lr=1.6606e-04) (hash(x)=20242060) +1533 train 7.178033 (lr=1.6605e-04) (hash(x)=21549554) +1534 train 6.985710 (lr=1.6604e-04) (hash(x)=21642024) +1535 train 7.489873 (lr=1.6603e-04) (hash(x)=25367597) +1536 train 7.657135 (lr=1.6602e-04) (hash(x)=27224144) +1537 train 7.214709 (lr=1.6601e-04) (hash(x)=24409290) +1538 train 7.338246 (lr=1.6599e-04) (hash(x)=24987180) +1539 train 7.205217 (lr=1.6598e-04) (hash(x)=27016702) +1540 train 7.490759 (lr=1.6597e-04) (hash(x)=25819636) +1541 train 7.411102 (lr=1.6596e-04) (hash(x)=25520453) +1542 train 7.221127 (lr=1.6595e-04) (hash(x)=23580496) +1543 train 7.420785 (lr=1.6594e-04) (hash(x)=25022148) +1544 train 7.406676 (lr=1.6593e-04) (hash(x)=25447327) +1545 train 7.401579 (lr=1.6591e-04) (hash(x)=25010319) +1546 train 7.331848 (lr=1.6590e-04) (hash(x)=25511777) +1547 train 7.370328 (lr=1.6589e-04) (hash(x)=24459012) +1548 train 7.379001 (lr=1.6588e-04) (hash(x)=25082785) +1549 train 7.423771 (lr=1.6587e-04) (hash(x)=26528670) +1550 val loss 7.4304 +1550 val perplexity 1686.4746 +1550 train 7.470870 (lr=1.6586e-04) (hash(x)=26684367) +1551 train 7.428014 (lr=1.6584e-04) (hash(x)=25431365) +1552 train 7.432413 (lr=1.6583e-04) (hash(x)=24802747) +1553 train 7.262413 (lr=1.6582e-04) (hash(x)=24229522) +1554 train 7.475128 (lr=1.6581e-04) (hash(x)=24757176) +1555 train 7.575279 (lr=1.6580e-04) (hash(x)=25958785) +1556 train 7.578231 (lr=1.6579e-04) (hash(x)=26810735) +1557 train 7.241680 (lr=1.6578e-04) (hash(x)=22882640) +1558 train 7.712522 (lr=1.6576e-04) (hash(x)=27220057) +1559 train 7.950438 (lr=1.6575e-04) (hash(x)=29307788) +1560 train 7.383049 (lr=1.6574e-04) (hash(x)=25214030) +1561 train 7.190193 (lr=1.6573e-04) (hash(x)=23167825) +1562 train 7.307439 (lr=1.6572e-04) (hash(x)=24658511) +1563 train 7.413217 (lr=1.6571e-04) (hash(x)=24965435) +1564 train 7.165338 (lr=1.6569e-04) (hash(x)=23620579) +1565 train 7.157141 (lr=1.6568e-04) (hash(x)=23772949) +1566 train 7.315460 (lr=1.6567e-04) (hash(x)=23807939) +1567 train 7.519860 (lr=1.6566e-04) (hash(x)=25651929) +1568 train 7.449608 (lr=1.6565e-04) (hash(x)=25549933) +1569 train 7.164639 (lr=1.6564e-04) (hash(x)=23146724) +1570 train 7.263537 (lr=1.6562e-04) (hash(x)=24099275) +1571 train 7.442217 (lr=1.6561e-04) (hash(x)=28451031) +1572 train 7.521511 (lr=1.6560e-04) (hash(x)=25488511) +1573 train 7.332733 (lr=1.6559e-04) (hash(x)=23796771) +1574 train 7.370192 (lr=1.6558e-04) (hash(x)=22642764) +1575 train 7.465704 (lr=1.6556e-04) (hash(x)=26312387) +1576 train 7.209690 (lr=1.6555e-04) (hash(x)=22486223) +1577 train 7.212653 (lr=1.6554e-04) (hash(x)=21257377) +1578 train 7.337718 (lr=1.6553e-04) (hash(x)=24328365) +1579 train 7.436723 (lr=1.6552e-04) (hash(x)=25326650) +1580 train 7.413919 (lr=1.6551e-04) (hash(x)=26484837) +1581 train 7.146164 (lr=1.6549e-04) (hash(x)=24605603) +1582 train 7.274971 (lr=1.6548e-04) (hash(x)=24668537) +1583 train 7.174123 (lr=1.6547e-04) (hash(x)=23804913) +1584 train 7.405556 (lr=1.6546e-04) (hash(x)=23615391) +1585 train 7.394158 (lr=1.6545e-04) (hash(x)=24322926) +1586 train 7.130039 (lr=1.6544e-04) (hash(x)=19753104) +1587 train 7.654859 (lr=1.6542e-04) (hash(x)=25537529) +1588 train 7.048524 (lr=1.6541e-04) (hash(x)=22835476) +1589 train 7.184866 (lr=1.6540e-04) (hash(x)=25707197) +1590 train 7.196456 (lr=1.6539e-04) (hash(x)=24191203) +1591 train 7.446921 (lr=1.6538e-04) (hash(x)=26115519) +1592 train 7.339021 (lr=1.6536e-04) (hash(x)=25781547) +1593 train 7.160634 (lr=1.6535e-04) (hash(x)=24850654) +1594 train 7.033348 (lr=1.6534e-04) (hash(x)=23300928) +1595 train 7.339694 (lr=1.6533e-04) (hash(x)=25494804) +1596 train 7.318798 (lr=1.6532e-04) (hash(x)=28169410) +1597 train 7.043469 (lr=1.6530e-04) (hash(x)=21972022) +1598 train 7.610849 (lr=1.6529e-04) (hash(x)=27687290) +1599 train 7.486389 (lr=1.6528e-04) (hash(x)=23210747) +1600 val loss 7.2710 +1600 val perplexity 1437.9382 +1600 train 7.501176 (lr=1.6527e-04) (hash(x)=20362758) +1601 train 7.308906 (lr=1.6526e-04) (hash(x)=17064773) +1602 train 7.364179 (lr=1.6525e-04) (hash(x)=17173694) +1603 train 7.455631 (lr=1.6523e-04) (hash(x)=15717069) +1604 train 7.562051 (lr=1.6522e-04) (hash(x)=15117973) +1605 train 7.355237 (lr=1.6521e-04) (hash(x)=16189636) +1606 train 7.284162 (lr=1.6520e-04) (hash(x)=16552095) +1607 train 7.090854 (lr=1.6519e-04) (hash(x)=18463712) +1608 train 7.307449 (lr=1.6517e-04) (hash(x)=17572155) +1609 train 7.232821 (lr=1.6516e-04) (hash(x)=19970072) +1610 train 7.249608 (lr=1.6515e-04) (hash(x)=20463871) +1611 train 7.331616 (lr=1.6514e-04) (hash(x)=20705573) +1612 train 7.137517 (lr=1.6513e-04) (hash(x)=24441646) +1613 train 7.274456 (lr=1.6511e-04) (hash(x)=22913147) +1614 train 7.427258 (lr=1.6510e-04) (hash(x)=23081598) +1615 train 7.114437 (lr=1.6509e-04) (hash(x)=23245699) +1616 train 7.167871 (lr=1.6508e-04) (hash(x)=23003072) +1617 train 7.463864 (lr=1.6507e-04) (hash(x)=27121904) +1618 train 7.231728 (lr=1.6505e-04) (hash(x)=25092305) +1619 train 7.231902 (lr=1.6504e-04) (hash(x)=23444521) +1620 train 7.220036 (lr=1.6503e-04) (hash(x)=22130531) +1621 train 6.957895 (lr=1.6502e-04) (hash(x)=20917937) +1622 train 7.130357 (lr=1.6501e-04) (hash(x)=22526838) +1623 train 7.286672 (lr=1.6499e-04) (hash(x)=21770300) +1624 train 8.583307 (lr=1.6498e-04) (hash(x)=22333537) +1625 train 8.550054 (lr=1.6497e-04) (hash(x)=24642519) +1626 train 7.556656 (lr=1.6496e-04) (hash(x)=25199038) +1627 train 7.297684 (lr=1.6495e-04) (hash(x)=23334569) +1628 train 7.171978 (lr=1.6493e-04) (hash(x)=23785360) +1629 train 6.791272 (lr=1.6492e-04) (hash(x)=21796200) +1630 train 6.911582 (lr=1.6491e-04) (hash(x)=22389081) +1631 train 7.248747 (lr=1.6490e-04) (hash(x)=25387532) +1632 train 6.758584 (lr=1.6488e-04) (hash(x)=17247578) +1633 train 7.174242 (lr=1.6487e-04) (hash(x)=22203733) +1634 train 7.336106 (lr=1.6486e-04) (hash(x)=24387455) +1635 train 7.887946 (lr=1.6485e-04) (hash(x)=29466743) +1636 train 7.190125 (lr=1.6484e-04) (hash(x)=25354152) +1637 train 7.225708 (lr=1.6482e-04) (hash(x)=21756102) +1638 train 7.206601 (lr=1.6481e-04) (hash(x)=23544029) +1639 train 7.399269 (lr=1.6480e-04) (hash(x)=27718703) +1640 train 7.341606 (lr=1.6479e-04) (hash(x)=25697138) +1641 train 7.148211 (lr=1.6477e-04) (hash(x)=22978681) +1642 train 7.784538 (lr=1.6476e-04) (hash(x)=29527067) +1643 train 6.755062 (lr=1.6475e-04) (hash(x)=17631973) +1644 train 7.216228 (lr=1.6474e-04) (hash(x)=24860172) +1645 train 7.591127 (lr=1.6473e-04) (hash(x)=27947891) +1646 train 7.284027 (lr=1.6471e-04) (hash(x)=23819556) +1647 train 7.315064 (lr=1.6470e-04) (hash(x)=27661052) +1648 train 7.093138 (lr=1.6469e-04) (hash(x)=23014209) +1649 train 7.028848 (lr=1.6468e-04) (hash(x)=23061452) +1650 val loss 7.2766 +1650 val perplexity 1446.1194 +1650 train 7.171418 (lr=1.6466e-04) (hash(x)=21949051) +1651 train 7.186359 (lr=1.6465e-04) (hash(x)=22244096) +1652 train 7.188350 (lr=1.6464e-04) (hash(x)=25997585) +1653 train 7.238754 (lr=1.6463e-04) (hash(x)=25389713) +1654 train 7.218964 (lr=1.6462e-04) (hash(x)=24390520) +1655 train 7.442935 (lr=1.6460e-04) (hash(x)=26538928) +1656 train 7.363515 (lr=1.6459e-04) (hash(x)=28708088) +1657 train 7.504682 (lr=1.6458e-04) (hash(x)=25685569) +1658 train 7.024418 (lr=1.6457e-04) (hash(x)=22163531) +1659 train 7.212404 (lr=1.6455e-04) (hash(x)=26256802) +1660 train 7.657377 (lr=1.6454e-04) (hash(x)=30016026) +1661 train 7.220600 (lr=1.6453e-04) (hash(x)=24412323) +1662 train 7.219957 (lr=1.6452e-04) (hash(x)=24722307) +1663 train 7.085941 (lr=1.6451e-04) (hash(x)=21772654) +1664 train 7.084169 (lr=1.6449e-04) (hash(x)=24984527) +1665 train 7.265189 (lr=1.6448e-04) (hash(x)=25456825) +1666 train 7.654068 (lr=1.6447e-04) (hash(x)=24383976) +1667 train 7.573377 (lr=1.6446e-04) (hash(x)=25026277) +1668 train 7.430221 (lr=1.6444e-04) (hash(x)=28121715) +1669 train 7.444784 (lr=1.6443e-04) (hash(x)=26855439) +1670 train 7.509673 (lr=1.6442e-04) (hash(x)=33370924) +1671 train 7.349098 (lr=1.6441e-04) (hash(x)=26263254) +1672 train 7.790666 (lr=1.6439e-04) (hash(x)=29958158) +1673 train 7.047262 (lr=1.6438e-04) (hash(x)=21917396) +1674 train 7.208477 (lr=1.6437e-04) (hash(x)=24196295) +1675 train 7.249268 (lr=1.6436e-04) (hash(x)=24726314) +1676 train 7.039673 (lr=1.6434e-04) (hash(x)=22137742) +1677 train 7.144693 (lr=1.6433e-04) (hash(x)=24375100) +1678 train 7.098998 (lr=1.6432e-04) (hash(x)=23965039) +1679 train 7.168224 (lr=1.6431e-04) (hash(x)=23552356) +1680 train 7.144143 (lr=1.6429e-04) (hash(x)=26136969) +1681 train 7.417824 (lr=1.6428e-04) (hash(x)=25343112) +1682 train 7.045166 (lr=1.6427e-04) (hash(x)=22831508) +1683 train 7.375862 (lr=1.6426e-04) (hash(x)=26699819) +1684 train 7.475155 (lr=1.6424e-04) (hash(x)=25435504) +1685 train 7.655764 (lr=1.6423e-04) (hash(x)=25218858) +1686 train 8.302829 (lr=1.6422e-04) (hash(x)=25664448) +1687 train 7.280414 (lr=1.6421e-04) (hash(x)=22707141) +1688 train 7.480034 (lr=1.6419e-04) (hash(x)=28001383) +1689 train 7.718097 (lr=1.6418e-04) (hash(x)=29168269) +1690 train 7.666060 (lr=1.6417e-04) (hash(x)=29637522) +1691 train 7.684673 (lr=1.6416e-04) (hash(x)=25676149) +1692 train 7.068163 (lr=1.6414e-04) (hash(x)=20919831) +1693 train 7.296121 (lr=1.6413e-04) (hash(x)=24324401) +1694 train 7.397287 (lr=1.6412e-04) (hash(x)=26862625) +1695 train 7.798262 (lr=1.6411e-04) (hash(x)=34234481) +1696 train 7.368875 (lr=1.6409e-04) (hash(x)=27415195) +1697 train 7.187064 (lr=1.6408e-04) (hash(x)=24511386) +1698 train 7.340076 (lr=1.6407e-04) (hash(x)=26904299) +1699 train 7.212640 (lr=1.6406e-04) (hash(x)=25401624) +1700 val loss 7.3020 +1700 val perplexity 1483.1907 +1700 train 7.248598 (lr=1.6404e-04) (hash(x)=26498489) +1701 train 7.226238 (lr=1.6403e-04) (hash(x)=22340685) +1702 train 7.316528 (lr=1.6402e-04) (hash(x)=26396757) +1703 train 7.886951 (lr=1.6401e-04) (hash(x)=35008670) +1704 train 7.680492 (lr=1.6399e-04) (hash(x)=31782020) +1705 train 7.573119 (lr=1.6398e-04) (hash(x)=29662286) +1706 train 7.731805 (lr=1.6397e-04) (hash(x)=34215782) +1707 train 7.254550 (lr=1.6396e-04) (hash(x)=25682280) +1708 train 7.420062 (lr=1.6394e-04) (hash(x)=27109048) +1709 train 7.471841 (lr=1.6393e-04) (hash(x)=27686498) +1710 train 7.287634 (lr=1.6392e-04) (hash(x)=24247565) +1711 train 7.304961 (lr=1.6390e-04) (hash(x)=25891543) +1712 train 7.439661 (lr=1.6389e-04) (hash(x)=26436778) +1713 train 7.075690 (lr=1.6388e-04) (hash(x)=22538881) +1714 train 7.025755 (lr=1.6387e-04) (hash(x)=21993512) +1715 train 7.483900 (lr=1.6385e-04) (hash(x)=25962407) +1716 train 7.298737 (lr=1.6384e-04) (hash(x)=24130284) +1717 train 7.144246 (lr=1.6383e-04) (hash(x)=24819073) +1718 train 7.014967 (lr=1.6382e-04) (hash(x)=23496648) +1719 train 7.095488 (lr=1.6380e-04) (hash(x)=21971224) +1720 train 7.025270 (lr=1.6379e-04) (hash(x)=21498081) +1721 train 7.115477 (lr=1.6378e-04) (hash(x)=20951317) +1722 train 7.630486 (lr=1.6377e-04) (hash(x)=28848134) +1723 train 7.700840 (lr=1.6375e-04) (hash(x)=30838142) +1724 train 7.634568 (lr=1.6374e-04) (hash(x)=28844392) +1725 train 7.193707 (lr=1.6373e-04) (hash(x)=23102419) +1726 train 7.267460 (lr=1.6371e-04) (hash(x)=22374479) +1727 train 7.542402 (lr=1.6370e-04) (hash(x)=27312186) +1728 train 7.872952 (lr=1.6369e-04) (hash(x)=34362559) +1729 train 7.777922 (lr=1.6368e-04) (hash(x)=30920030) +1730 train 7.121533 (lr=1.6366e-04) (hash(x)=23684126) +1731 train 7.391853 (lr=1.6365e-04) (hash(x)=23657081) +1732 train 7.601189 (lr=1.6364e-04) (hash(x)=28463299) +1733 train 7.867067 (lr=1.6362e-04) (hash(x)=35351214) +1734 train 7.474550 (lr=1.6361e-04) (hash(x)=28855662) +1735 train 6.998113 (lr=1.6360e-04) (hash(x)=22163749) +1736 train 7.058745 (lr=1.6359e-04) (hash(x)=22024585) +1737 train 7.258780 (lr=1.6357e-04) (hash(x)=24629160) +1738 train 7.352330 (lr=1.6356e-04) (hash(x)=25220941) +1739 train 7.297846 (lr=1.6355e-04) (hash(x)=24829818) +1740 train 7.582832 (lr=1.6353e-04) (hash(x)=28453898) +1741 train 7.605388 (lr=1.6352e-04) (hash(x)=25424550) +1742 train 7.254057 (lr=1.6351e-04) (hash(x)=23437814) +1743 train 7.310852 (lr=1.6350e-04) (hash(x)=25942888) +1744 train 7.312141 (lr=1.6348e-04) (hash(x)=24503801) +1745 train 7.611123 (lr=1.6347e-04) (hash(x)=26418501) +1746 train 7.489871 (lr=1.6346e-04) (hash(x)=27177691) +1747 train 7.205851 (lr=1.6344e-04) (hash(x)=23785671) +1748 train 7.623587 (lr=1.6343e-04) (hash(x)=27362772) +1749 train 7.443796 (lr=1.6342e-04) (hash(x)=25097859) +1750 val loss 7.4059 +1750 val perplexity 1645.7390 +1750 train 7.341625 (lr=1.6341e-04) (hash(x)=24662466) +1751 train 7.322026 (lr=1.6339e-04) (hash(x)=25493916) +1752 train 7.418012 (lr=1.6338e-04) (hash(x)=24655868) +1753 train 7.724738 (lr=1.6337e-04) (hash(x)=19819210) +1754 train 7.244172 (lr=1.6335e-04) (hash(x)=21377155) +1755 train 8.055181 (lr=1.6334e-04) (hash(x)=28618702) +1756 train 7.959068 (lr=1.6333e-04) (hash(x)=27324953) +1757 train 7.692624 (lr=1.6332e-04) (hash(x)=29707907) +1758 train 7.513181 (lr=1.6330e-04) (hash(x)=24485921) +1759 train 7.552084 (lr=1.6329e-04) (hash(x)=24289951) +1760 train 7.253102 (lr=1.6328e-04) (hash(x)=22496716) +1761 train 7.381464 (lr=1.6326e-04) (hash(x)=25147026) +1762 train 7.464668 (lr=1.6325e-04) (hash(x)=26851828) +1763 train 7.425089 (lr=1.6324e-04) (hash(x)=26331486) +1764 train 7.308406 (lr=1.6322e-04) (hash(x)=24383054) +1765 train 7.453807 (lr=1.6321e-04) (hash(x)=25885126) +1766 train 7.388313 (lr=1.6320e-04) (hash(x)=25848470) +1767 train 7.233982 (lr=1.6319e-04) (hash(x)=23648671) +1768 train 7.191710 (lr=1.6317e-04) (hash(x)=23168674) +1769 train 7.090745 (lr=1.6316e-04) (hash(x)=20252079) +1770 train 7.258813 (lr=1.6315e-04) (hash(x)=23914287) +1771 train 7.533853 (lr=1.6313e-04) (hash(x)=27292797) +1772 train 6.817169 (lr=1.6312e-04) (hash(x)=16175151) +1773 train 6.873670 (lr=1.6311e-04) (hash(x)=18317379) +1774 train 7.248487 (lr=1.6309e-04) (hash(x)=24464271) +1775 train 7.259520 (lr=1.6308e-04) (hash(x)=24992055) +1776 train 8.015744 (lr=1.6307e-04) (hash(x)=26032451) +1777 train 7.689949 (lr=1.6305e-04) (hash(x)=24734221) +1778 train 7.657399 (lr=1.6304e-04) (hash(x)=25413430) +1779 train 7.516860 (lr=1.6303e-04) (hash(x)=24398330) +1780 train 7.324323 (lr=1.6302e-04) (hash(x)=24568049) +1781 train 7.217259 (lr=1.6300e-04) (hash(x)=23573984) +1782 train 7.430954 (lr=1.6299e-04) (hash(x)=27338410) +1783 train 7.381303 (lr=1.6298e-04) (hash(x)=26005549) +1784 train 7.194011 (lr=1.6296e-04) (hash(x)=24332331) +1785 train 7.042339 (lr=1.6295e-04) (hash(x)=22583878) +1786 train 7.240771 (lr=1.6294e-04) (hash(x)=24599113) +1787 train 7.718166 (lr=1.6292e-04) (hash(x)=30259737) +1788 train 7.466953 (lr=1.6291e-04) (hash(x)=26504237) +1789 train 7.326870 (lr=1.6290e-04) (hash(x)=25196470) +1790 train 7.215918 (lr=1.6288e-04) (hash(x)=23607871) +1791 train 7.167131 (lr=1.6287e-04) (hash(x)=21046554) +1792 train 7.439487 (lr=1.6286e-04) (hash(x)=27285635) +1793 train 7.350099 (lr=1.6284e-04) (hash(x)=25454371) +1794 train 7.439826 (lr=1.6283e-04) (hash(x)=26486575) +1795 train 6.930726 (lr=1.6282e-04) (hash(x)=18773877) +1796 train 7.084840 (lr=1.6280e-04) (hash(x)=22506761) +1797 train 7.266544 (lr=1.6279e-04) (hash(x)=24645168) +1798 train 7.370632 (lr=1.6278e-04) (hash(x)=25046236) +1799 train 7.433629 (lr=1.6276e-04) (hash(x)=26321539) +1800 val loss 7.2692 +1800 val perplexity 1435.3632 +1800 train 7.219833 (lr=1.6275e-04) (hash(x)=24602494) +1801 train 7.365238 (lr=1.6274e-04) (hash(x)=25722713) +1802 train 7.115065 (lr=1.6273e-04) (hash(x)=23711219) +1803 train 7.250369 (lr=1.6271e-04) (hash(x)=22850804) +1804 train 7.586272 (lr=1.6270e-04) (hash(x)=25829388) +1805 train 7.099280 (lr=1.6269e-04) (hash(x)=22503524) +1806 train 7.410714 (lr=1.6267e-04) (hash(x)=26669453) +1807 train 7.327237 (lr=1.6266e-04) (hash(x)=27807872) +1808 train 7.354506 (lr=1.6265e-04) (hash(x)=23543560) +1809 train 7.476438 (lr=1.6263e-04) (hash(x)=25845590) +1810 train 7.240832 (lr=1.6262e-04) (hash(x)=23026635) +1811 train 7.175022 (lr=1.6261e-04) (hash(x)=25545137) +1812 train 7.692465 (lr=1.6259e-04) (hash(x)=27746841) +1813 train 7.074871 (lr=1.6258e-04) (hash(x)=25471231) +1814 train 7.213440 (lr=1.6257e-04) (hash(x)=24333204) +1815 train 7.062416 (lr=1.6255e-04) (hash(x)=21555364) +1816 train 7.306696 (lr=1.6254e-04) (hash(x)=26317977) +1817 train 7.361377 (lr=1.6253e-04) (hash(x)=24474988) +1818 train 7.024857 (lr=1.6251e-04) (hash(x)=21975953) +1819 train 7.670538 (lr=1.6250e-04) (hash(x)=27243798) +1820 train 7.269388 (lr=1.6249e-04) (hash(x)=25097367) +1821 train 7.170856 (lr=1.6247e-04) (hash(x)=24419085) +1822 train 7.134879 (lr=1.6246e-04) (hash(x)=23058837) +1823 train 7.268482 (lr=1.6245e-04) (hash(x)=26325324) +1824 train 7.025890 (lr=1.6243e-04) (hash(x)=20581023) +1825 train 7.364281 (lr=1.6242e-04) (hash(x)=24822111) +1826 train 7.101998 (lr=1.6240e-04) (hash(x)=24336304) +1827 train 7.273628 (lr=1.6239e-04) (hash(x)=26228728) +1828 train 7.374319 (lr=1.6238e-04) (hash(x)=26445781) +1829 train 7.486526 (lr=1.6236e-04) (hash(x)=24707042) +1830 train 7.723287 (lr=1.6235e-04) (hash(x)=27882744) +1831 train 7.233582 (lr=1.6234e-04) (hash(x)=24956294) +1832 train 6.993316 (lr=1.6232e-04) (hash(x)=20984728) +1833 train 7.028873 (lr=1.6231e-04) (hash(x)=23424737) +1834 train 7.472147 (lr=1.6230e-04) (hash(x)=26207120) +1835 train 7.482695 (lr=1.6228e-04) (hash(x)=25592289) +1836 train 7.166344 (lr=1.6227e-04) (hash(x)=24326649) +1837 train 7.284610 (lr=1.6226e-04) (hash(x)=26826109) +1838 train 7.258144 (lr=1.6224e-04) (hash(x)=24759294) +1839 train 7.241713 (lr=1.6223e-04) (hash(x)=24429389) +1840 train 7.199516 (lr=1.6222e-04) (hash(x)=25537519) +1841 train 7.149530 (lr=1.6220e-04) (hash(x)=24747421) +1842 train 7.077511 (lr=1.6219e-04) (hash(x)=23079065) +1843 train 7.511849 (lr=1.6218e-04) (hash(x)=28733708) +1844 train 7.229520 (lr=1.6216e-04) (hash(x)=23937742) +1845 train 7.574337 (lr=1.6215e-04) (hash(x)=29704803) +1846 train 7.762073 (lr=1.6214e-04) (hash(x)=34617155) +1847 train 7.443501 (lr=1.6212e-04) (hash(x)=27929846) +1848 train 7.799062 (lr=1.6211e-04) (hash(x)=28280878) +1849 train 6.842117 (lr=1.6209e-04) (hash(x)=18961171) +1850 val loss 7.3241 +1850 val perplexity 1516.3861 +1850 train 7.426657 (lr=1.6208e-04) (hash(x)=27146015) +1851 train 7.227602 (lr=1.6207e-04) (hash(x)=22417476) +1852 train 7.318500 (lr=1.6205e-04) (hash(x)=24583152) +1853 train 7.352390 (lr=1.6204e-04) (hash(x)=26364120) +1854 train 7.554353 (lr=1.6203e-04) (hash(x)=25946767) +1855 train 7.383958 (lr=1.6201e-04) (hash(x)=25282897) +1856 train 7.317191 (lr=1.6200e-04) (hash(x)=25154557) +1857 train 6.977659 (lr=1.6199e-04) (hash(x)=22082503) +1858 train 7.056587 (lr=1.6197e-04) (hash(x)=23974606) +1859 train 7.221857 (lr=1.6196e-04) (hash(x)=22278062) +1860 train 7.082490 (lr=1.6194e-04) (hash(x)=19509639) +1861 train 7.405208 (lr=1.6193e-04) (hash(x)=24271468) +1862 train 6.980028 (lr=1.6192e-04) (hash(x)=21943809) +1863 train 7.236475 (lr=1.6190e-04) (hash(x)=26802508) +1864 train 7.865304 (lr=1.6189e-04) (hash(x)=34178409) +1865 train 8.028258 (lr=1.6188e-04) (hash(x)=33468379) +1866 train 7.059215 (lr=1.6186e-04) (hash(x)=22109262) +1867 train 6.831377 (lr=1.6185e-04) (hash(x)=22094832) +1868 train 7.101114 (lr=1.6184e-04) (hash(x)=24016953) +1869 train 7.405936 (lr=1.6182e-04) (hash(x)=26759850) +1870 train 7.169353 (lr=1.6181e-04) (hash(x)=23570779) +1871 train 7.711740 (lr=1.6179e-04) (hash(x)=28390416) +1872 train 7.706543 (lr=1.6178e-04) (hash(x)=26215770) +1873 train 7.574484 (lr=1.6177e-04) (hash(x)=22727956) +1874 train 7.356513 (lr=1.6175e-04) (hash(x)=21304587) +1875 train 7.691915 (lr=1.6174e-04) (hash(x)=26379331) +1876 train 7.759737 (lr=1.6173e-04) (hash(x)=25252419) +1877 train 7.557701 (lr=1.6171e-04) (hash(x)=25048158) +1878 train 7.512177 (lr=1.6170e-04) (hash(x)=23588991) +1879 train 7.495528 (lr=1.6168e-04) (hash(x)=26292451) +1880 train 7.394562 (lr=1.6167e-04) (hash(x)=23617086) +1881 train 7.229252 (lr=1.6166e-04) (hash(x)=23336031) +1882 train 7.166322 (lr=1.6164e-04) (hash(x)=19198742) +1883 train 7.854514 (lr=1.6163e-04) (hash(x)=26301866) +1884 train 7.860614 (lr=1.6162e-04) (hash(x)=30114703) +1885 train 7.367090 (lr=1.6160e-04) (hash(x)=26687040) +1886 train 7.205082 (lr=1.6159e-04) (hash(x)=25810717) +1887 train 7.011371 (lr=1.6157e-04) (hash(x)=22915344) +1888 train 7.409688 (lr=1.6156e-04) (hash(x)=27046189) +1889 train 6.975840 (lr=1.6155e-04) (hash(x)=19831900) +1890 train 7.402847 (lr=1.6153e-04) (hash(x)=27786987) +1891 train 7.252219 (lr=1.6152e-04) (hash(x)=25448318) +1892 train 7.277597 (lr=1.6150e-04) (hash(x)=25166953) +1893 train 7.239468 (lr=1.6149e-04) (hash(x)=24993116) +1894 train 7.302376 (lr=1.6148e-04) (hash(x)=25748002) +1895 train 7.500161 (lr=1.6146e-04) (hash(x)=24744383) +1896 train 7.247400 (lr=1.6145e-04) (hash(x)=25560120) +1897 train 7.086308 (lr=1.6144e-04) (hash(x)=23731849) +1898 train 7.086178 (lr=1.6142e-04) (hash(x)=24115851) +1899 train 7.099779 (lr=1.6141e-04) (hash(x)=22835201) +1900 val loss 7.2562 +1900 val perplexity 1416.9086 +1900 train 6.863307 (lr=1.6139e-04) (hash(x)=21927896) +1901 train 7.317227 (lr=1.6138e-04) (hash(x)=24652361) +1902 train 7.477891 (lr=1.6137e-04) (hash(x)=27332405) +1903 train 7.286640 (lr=1.6135e-04) (hash(x)=26284678) +1904 train 7.215805 (lr=1.6134e-04) (hash(x)=23441305) +1905 train 7.327855 (lr=1.6132e-04) (hash(x)=27522881) +1906 train 7.391940 (lr=1.6131e-04) (hash(x)=25521191) +1907 train 7.178020 (lr=1.6130e-04) (hash(x)=24745936) +1908 train 7.034941 (lr=1.6128e-04) (hash(x)=21653364) +1909 train 7.108534 (lr=1.6127e-04) (hash(x)=21973969) +1910 train 7.115398 (lr=1.6125e-04) (hash(x)=24318192) +1911 train 7.030292 (lr=1.6124e-04) (hash(x)=21654269) +1912 train 7.116159 (lr=1.6123e-04) (hash(x)=24142904) +1913 train 6.994406 (lr=1.6121e-04) (hash(x)=21708739) +1914 train 7.206236 (lr=1.6120e-04) (hash(x)=22937923) +1915 train 7.874969 (lr=1.6118e-04) (hash(x)=32387999) +1916 train 8.036023 (lr=1.6117e-04) (hash(x)=28958671) +1917 train 8.100249 (lr=1.6116e-04) (hash(x)=32662682) +1918 train 8.002723 (lr=1.6114e-04) (hash(x)=31364539) +1919 train 8.089328 (lr=1.6113e-04) (hash(x)=29466268) +1920 train 8.085149 (lr=1.6111e-04) (hash(x)=31407564) +1921 train 7.956907 (lr=1.6110e-04) (hash(x)=28372973) +1922 train 8.041545 (lr=1.6109e-04) (hash(x)=28620993) +1923 train 8.099687 (lr=1.6107e-04) (hash(x)=30736727) +1924 train 7.994526 (lr=1.6106e-04) (hash(x)=30370374) +1925 train 7.941513 (lr=1.6104e-04) (hash(x)=29935562) +1926 train 7.950794 (lr=1.6103e-04) (hash(x)=30528627) +1927 train 7.971669 (lr=1.6102e-04) (hash(x)=32616762) +1928 train 7.801467 (lr=1.6100e-04) (hash(x)=29150044) +1929 train 7.996005 (lr=1.6099e-04) (hash(x)=32861403) +1930 train 7.943851 (lr=1.6097e-04) (hash(x)=31053918) +1931 train 7.826106 (lr=1.6096e-04) (hash(x)=29358578) +1932 train 7.932935 (lr=1.6095e-04) (hash(x)=31521292) +1933 train 7.869270 (lr=1.6093e-04) (hash(x)=31218966) +1934 train 7.861826 (lr=1.6092e-04) (hash(x)=31811872) +1935 train 8.047640 (lr=1.6090e-04) (hash(x)=32201138) +1936 train 7.767793 (lr=1.6089e-04) (hash(x)=28631348) +1937 train 7.901022 (lr=1.6088e-04) (hash(x)=30545133) +1938 train 7.926437 (lr=1.6086e-04) (hash(x)=32136080) +1939 train 8.069507 (lr=1.6085e-04) (hash(x)=30041621) +1940 train 7.788131 (lr=1.6083e-04) (hash(x)=30537181) +1941 train 7.820801 (lr=1.6082e-04) (hash(x)=30371023) +1942 train 7.995014 (lr=1.6080e-04) (hash(x)=30734634) +1943 train 7.877399 (lr=1.6079e-04) (hash(x)=33683468) +1944 train 7.916912 (lr=1.6078e-04) (hash(x)=30472451) +1945 train 7.705305 (lr=1.6076e-04) (hash(x)=29809830) +1946 train 7.443088 (lr=1.6075e-04) (hash(x)=26077593) +1947 train 7.412007 (lr=1.6073e-04) (hash(x)=26837755) +1948 train 7.359661 (lr=1.6072e-04) (hash(x)=23910920) +1949 train 7.343625 (lr=1.6070e-04) (hash(x)=26084089) +1950 val loss 7.3108 +1950 val perplexity 1496.3811 +1950 train 7.532030 (lr=1.6069e-04) (hash(x)=26963533) +1951 train 7.390300 (lr=1.6068e-04) (hash(x)=27498125) +1952 train 7.617512 (lr=1.6066e-04) (hash(x)=29512508) +1953 train 7.911982 (lr=1.6065e-04) (hash(x)=34478395) +1954 train 7.521584 (lr=1.6063e-04) (hash(x)=25357046) +1955 train 7.234955 (lr=1.6062e-04) (hash(x)=22372507) +1956 train 7.236884 (lr=1.6061e-04) (hash(x)=24501779) +1957 train 7.311534 (lr=1.6059e-04) (hash(x)=25638879) +1958 train 7.138063 (lr=1.6058e-04) (hash(x)=24243109) +1959 train 7.092000 (lr=1.6056e-04) (hash(x)=25164318) +1960 train 7.259423 (lr=1.6055e-04) (hash(x)=24139533) +1961 train 7.296360 (lr=1.6053e-04) (hash(x)=27271900) +1962 train 7.146139 (lr=1.6052e-04) (hash(x)=24869232) +1963 train 7.317382 (lr=1.6051e-04) (hash(x)=26562947) +1964 train 7.203918 (lr=1.6049e-04) (hash(x)=26477326) +1965 train 7.318383 (lr=1.6048e-04) (hash(x)=24917192) +1966 train 7.071882 (lr=1.6046e-04) (hash(x)=23110147) +1967 train 7.130995 (lr=1.6045e-04) (hash(x)=25690221) +1968 train 7.644417 (lr=1.6043e-04) (hash(x)=26999273) +1969 train 7.291521 (lr=1.6042e-04) (hash(x)=24807841) +1970 train 7.155107 (lr=1.6041e-04) (hash(x)=23918831) +1971 train 7.068317 (lr=1.6039e-04) (hash(x)=21947305) +1972 train 7.163064 (lr=1.6038e-04) (hash(x)=22874486) +1973 train 7.054958 (lr=1.6036e-04) (hash(x)=22195089) +1974 train 7.211752 (lr=1.6035e-04) (hash(x)=25345359) +1975 train 7.402302 (lr=1.6033e-04) (hash(x)=29031550) +1976 train 7.346088 (lr=1.6032e-04) (hash(x)=29947423) +1977 train 7.503078 (lr=1.6030e-04) (hash(x)=29395823) +1978 train 7.311876 (lr=1.6029e-04) (hash(x)=26968216) +1979 train 7.323287 (lr=1.6028e-04) (hash(x)=26551589) +1980 train 7.323671 (lr=1.6026e-04) (hash(x)=25657210) +1981 train 7.254526 (lr=1.6025e-04) (hash(x)=23689487) +1982 train 7.376972 (lr=1.6023e-04) (hash(x)=25744240) +1983 train 7.380562 (lr=1.6022e-04) (hash(x)=24094093) +1984 train 7.036565 (lr=1.6020e-04) (hash(x)=21724872) +1985 train 7.075033 (lr=1.6019e-04) (hash(x)=24106453) +1986 train 7.153900 (lr=1.6017e-04) (hash(x)=25004577) +1987 train 7.193401 (lr=1.6016e-04) (hash(x)=23639076) +1988 train 7.486170 (lr=1.6015e-04) (hash(x)=29408797) +1989 train 7.130006 (lr=1.6013e-04) (hash(x)=25107314) +1990 train 9.678256 (lr=1.6012e-04) (hash(x)=49896019) +1991 train 11.046910 (lr=1.6010e-04) (hash(x)=61455960) +1992 train 10.882050 (lr=1.6009e-04) (hash(x)=63788199) +1993 train 10.831428 (lr=1.6007e-04) (hash(x)=63899424) +1994 train 10.373246 (lr=1.6006e-04) (hash(x)=66412689) +1995 train 9.896728 (lr=1.6004e-04) (hash(x)=65636572) +1996 train 9.853324 (lr=1.6003e-04) (hash(x)=69649789) +1997 train 9.571767 (lr=1.6002e-04) (hash(x)=71578682) +1998 train 9.034022 (lr=1.6000e-04) (hash(x)=58341730) +1999 train 9.092596 (lr=1.5999e-04) (hash(x)=61104710) +2000 val loss 8.6472 +2000 val perplexity 5694.2275 +2000 train 8.894055 (lr=1.5997e-04) (hash(x)=52865322) +2001 train 8.633693 (lr=1.5996e-04) (hash(x)=23633693) +2002 train 8.324859 (lr=1.5994e-04) (hash(x)=25297571) +2003 train 8.494910 (lr=1.5993e-04) (hash(x)=24123821) +2004 train 7.642186 (lr=1.5991e-04) (hash(x)=20161517) +2005 train 7.410820 (lr=1.5990e-04) (hash(x)=19919984) +2006 train 7.188477 (lr=1.5988e-04) (hash(x)=18626507) +2007 train 7.199123 (lr=1.5987e-04) (hash(x)=20881126) +2008 train 7.393880 (lr=1.5986e-04) (hash(x)=26261448) +2009 train 7.533408 (lr=1.5984e-04) (hash(x)=27528050) +2010 train 7.579884 (lr=1.5983e-04) (hash(x)=26692097) +2011 train 7.333307 (lr=1.5981e-04) (hash(x)=23209969) +2012 train 7.323621 (lr=1.5980e-04) (hash(x)=26083446) +2013 train 7.669507 (lr=1.5978e-04) (hash(x)=28426467) +2014 train 7.380187 (lr=1.5977e-04) (hash(x)=26158154) +2015 train 7.479363 (lr=1.5975e-04) (hash(x)=26920243) +2016 train 7.147748 (lr=1.5974e-04) (hash(x)=21365321) +2017 train 7.247185 (lr=1.5972e-04) (hash(x)=25730699) +2018 train 7.316593 (lr=1.5971e-04) (hash(x)=25177106) +2019 train 7.222255 (lr=1.5969e-04) (hash(x)=26127756) +2020 train 6.764052 (lr=1.5968e-04) (hash(x)=19770037) +2021 train 7.228851 (lr=1.5967e-04) (hash(x)=26479346) +2022 train 7.250793 (lr=1.5965e-04) (hash(x)=25967643) +2023 train 7.224297 (lr=1.5964e-04) (hash(x)=21970343) +2024 train 7.417888 (lr=1.5962e-04) (hash(x)=26449648) +2025 train 7.291475 (lr=1.5961e-04) (hash(x)=24874094) +2026 train 6.998661 (lr=1.5959e-04) (hash(x)=21399697) +2027 train 7.216011 (lr=1.5958e-04) (hash(x)=24097897) +2028 train 7.250455 (lr=1.5956e-04) (hash(x)=24453548) +2029 train 7.355218 (lr=1.5955e-04) (hash(x)=26692093) +2030 train 7.181571 (lr=1.5953e-04) (hash(x)=27217002) +2031 train 7.573545 (lr=1.5952e-04) (hash(x)=31676352) +2032 train 7.237731 (lr=1.5950e-04) (hash(x)=23396350) +2033 train 7.262383 (lr=1.5949e-04) (hash(x)=26245173) +2034 train 7.280874 (lr=1.5947e-04) (hash(x)=24821033) +2035 train 7.347166 (lr=1.5946e-04) (hash(x)=23908053) +2036 train 7.044837 (lr=1.5944e-04) (hash(x)=23469373) +2037 train 7.087937 (lr=1.5943e-04) (hash(x)=24102198) +2038 train 7.143228 (lr=1.5941e-04) (hash(x)=24712135) +2039 train 7.417680 (lr=1.5940e-04) (hash(x)=25600562) +2040 train 7.307784 (lr=1.5939e-04) (hash(x)=23193393) +2041 train 7.324036 (lr=1.5937e-04) (hash(x)=24776954) +2042 train 7.413471 (lr=1.5936e-04) (hash(x)=28066546) +2043 train 7.019275 (lr=1.5934e-04) (hash(x)=23549168) +2044 train 7.059479 (lr=1.5933e-04) (hash(x)=22681487) +2045 train 7.265476 (lr=1.5931e-04) (hash(x)=26663184) +2046 train 7.198305 (lr=1.5930e-04) (hash(x)=23320809) +2047 train 7.101631 (lr=1.5928e-04) (hash(x)=22022924) +2048 train 7.423725 (lr=1.5927e-04) (hash(x)=27960930) +2049 train 7.225643 (lr=1.5925e-04) (hash(x)=24899178) +2050 val loss 7.2427 +2050 val perplexity 1397.9066 +2050 train 7.152396 (lr=1.5924e-04) (hash(x)=24450711) +2051 train 7.093633 (lr=1.5922e-04) (hash(x)=23294980) +2052 train 6.998044 (lr=1.5921e-04) (hash(x)=23243665) +2053 train 6.845966 (lr=1.5919e-04) (hash(x)=21004461) +2054 train 7.177963 (lr=1.5918e-04) (hash(x)=24493583) +2055 train 7.111917 (lr=1.5916e-04) (hash(x)=22777085) +2056 train 7.067745 (lr=1.5915e-04) (hash(x)=25169889) +2057 train 7.717716 (lr=1.5913e-04) (hash(x)=28395880) +2058 train 7.649124 (lr=1.5912e-04) (hash(x)=29603726) +2059 train 7.262711 (lr=1.5910e-04) (hash(x)=26271115) +2060 train 7.254970 (lr=1.5909e-04) (hash(x)=25616212) +2061 train 7.365761 (lr=1.5907e-04) (hash(x)=26398325) +2062 train 7.043277 (lr=1.5906e-04) (hash(x)=23836586) +2063 train 6.950112 (lr=1.5904e-04) (hash(x)=21727744) +2064 train 7.210767 (lr=1.5903e-04) (hash(x)=25183195) +2065 train 7.346199 (lr=1.5901e-04) (hash(x)=27108132) +2066 train 7.034501 (lr=1.5900e-04) (hash(x)=20987812) +2067 train 7.370450 (lr=1.5898e-04) (hash(x)=22729318) +2068 train 7.175453 (lr=1.5897e-04) (hash(x)=23129709) +2069 train 7.702399 (lr=1.5895e-04) (hash(x)=32820084) +2070 train 7.779653 (lr=1.5894e-04) (hash(x)=33763489) +2071 train 7.233571 (lr=1.5892e-04) (hash(x)=20701998) +2072 train 7.430488 (lr=1.5891e-04) (hash(x)=27765988) +2073 train 7.189389 (lr=1.5889e-04) (hash(x)=24157446) +2074 train 7.124725 (lr=1.5888e-04) (hash(x)=22014978) +2075 train 7.639429 (lr=1.5886e-04) (hash(x)=27928398) +2076 train 7.459953 (lr=1.5885e-04) (hash(x)=27880142) +2077 train 7.778523 (lr=1.5883e-04) (hash(x)=34991795) +2078 train 7.345614 (lr=1.5882e-04) (hash(x)=25944128) +2079 train 7.036781 (lr=1.5880e-04) (hash(x)=20863982) +2080 train 7.503552 (lr=1.5879e-04) (hash(x)=28036097) +2081 train 7.511941 (lr=1.5877e-04) (hash(x)=25813615) +2082 train 6.928011 (lr=1.5876e-04) (hash(x)=22862316) +2083 train 7.042249 (lr=1.5874e-04) (hash(x)=22827054) +2084 train 7.120474 (lr=1.5873e-04) (hash(x)=23996531) +2085 train 7.235318 (lr=1.5871e-04) (hash(x)=25756087) +2086 train 7.255491 (lr=1.5870e-04) (hash(x)=23165889) +2087 train 7.447152 (lr=1.5868e-04) (hash(x)=25084926) +2088 train 7.257859 (lr=1.5867e-04) (hash(x)=26063862) +2089 train 7.311599 (lr=1.5865e-04) (hash(x)=27843638) +2090 train 7.553064 (lr=1.5864e-04) (hash(x)=27375554) +2091 train 7.354466 (lr=1.5862e-04) (hash(x)=25540961) +2092 train 7.090865 (lr=1.5861e-04) (hash(x)=22933785) +2093 train 7.252834 (lr=1.5859e-04) (hash(x)=23996956) +2094 train 6.974164 (lr=1.5858e-04) (hash(x)=22915854) +2095 train 7.218649 (lr=1.5856e-04) (hash(x)=24412897) +2096 train 7.264292 (lr=1.5855e-04) (hash(x)=25152336) +2097 train 7.578674 (lr=1.5853e-04) (hash(x)=29525589) +2098 train 7.411214 (lr=1.5852e-04) (hash(x)=26435656) +2099 train 7.276034 (lr=1.5850e-04) (hash(x)=26269869) +2100 val loss 7.2206 +2100 val perplexity 1367.2644 +2100 train 7.028121 (lr=1.5849e-04) (hash(x)=23856783) +2101 train 7.324126 (lr=1.5847e-04) (hash(x)=26039611) +2102 train 7.047716 (lr=1.5846e-04) (hash(x)=25048861) +2103 train 7.184316 (lr=1.5844e-04) (hash(x)=25434913) +2104 train 7.369283 (lr=1.5843e-04) (hash(x)=24203891) +2105 train 7.259120 (lr=1.5841e-04) (hash(x)=26016998) +2106 train 7.311174 (lr=1.5840e-04) (hash(x)=23986767) +2107 train 7.251645 (lr=1.5838e-04) (hash(x)=25157653) +2108 train 7.404823 (lr=1.5837e-04) (hash(x)=30193751) +2109 train 7.256639 (lr=1.5835e-04) (hash(x)=22630574) +2110 train 7.100882 (lr=1.5833e-04) (hash(x)=23475467) +2111 train 7.400186 (lr=1.5832e-04) (hash(x)=26302544) +2112 train 7.165282 (lr=1.5830e-04) (hash(x)=21276592) +2113 train 7.446515 (lr=1.5829e-04) (hash(x)=27566393) +2114 train 7.197324 (lr=1.5827e-04) (hash(x)=25028015) +2115 train 6.949304 (lr=1.5826e-04) (hash(x)=22010703) +2116 train 7.336838 (lr=1.5824e-04) (hash(x)=23711709) +2117 train 7.363210 (lr=1.5823e-04) (hash(x)=26105026) +2118 train 7.774164 (lr=1.5821e-04) (hash(x)=34433894) +2119 train 7.801351 (lr=1.5820e-04) (hash(x)=34976197) +2120 train 7.296654 (lr=1.5818e-04) (hash(x)=27690727) +2121 train 7.176854 (lr=1.5817e-04) (hash(x)=24368234) +2122 train 7.153369 (lr=1.5815e-04) (hash(x)=25095726) +2123 train 7.326328 (lr=1.5814e-04) (hash(x)=28248301) +2124 train 7.053979 (lr=1.5812e-04) (hash(x)=23322302) +2125 train 7.497419 (lr=1.5811e-04) (hash(x)=26416200) +2126 train 7.169180 (lr=1.5809e-04) (hash(x)=26577567) +2127 train 7.222746 (lr=1.5808e-04) (hash(x)=23870805) +2128 train 7.119727 (lr=1.5806e-04) (hash(x)=25440544) +2129 train 7.278879 (lr=1.5804e-04) (hash(x)=25795021) +2130 train 7.116126 (lr=1.5803e-04) (hash(x)=20896402) +2131 train 7.135356 (lr=1.5801e-04) (hash(x)=24457252) +2132 train 7.225996 (lr=1.5800e-04) (hash(x)=25926760) +2133 train 7.104825 (lr=1.5798e-04) (hash(x)=23503725) +2134 train 7.681108 (lr=1.5797e-04) (hash(x)=28728828) +2135 train 7.146844 (lr=1.5795e-04) (hash(x)=25041103) +2136 train 7.198147 (lr=1.5794e-04) (hash(x)=22863770) +2137 train 7.071343 (lr=1.5792e-04) (hash(x)=23037755) +2138 train 7.251338 (lr=1.5791e-04) (hash(x)=25848413) +2139 train 7.313591 (lr=1.5789e-04) (hash(x)=25998487) +2140 train 7.177237 (lr=1.5788e-04) (hash(x)=22754440) +2141 train 7.429694 (lr=1.5786e-04) (hash(x)=27705382) +2142 train 7.458894 (lr=1.5784e-04) (hash(x)=27629095) +2143 train 7.307916 (lr=1.5783e-04) (hash(x)=26041745) +2144 train 7.088812 (lr=1.5781e-04) (hash(x)=21909712) +2145 train 7.243863 (lr=1.5780e-04) (hash(x)=24353905) +2146 train 7.163743 (lr=1.5778e-04) (hash(x)=24482587) +2147 train 7.294180 (lr=1.5777e-04) (hash(x)=27249810) +2148 train 7.443761 (lr=1.5775e-04) (hash(x)=26709938) +2149 train 7.052202 (lr=1.5774e-04) (hash(x)=23831457) +2150 val loss 7.1905 +2150 val perplexity 1326.7971 +2150 train 7.474754 (lr=1.5772e-04) (hash(x)=29776243) +2151 train 6.962151 (lr=1.5771e-04) (hash(x)=24068619) +2152 train 7.129467 (lr=1.5769e-04) (hash(x)=22208671) +2153 train 7.320988 (lr=1.5767e-04) (hash(x)=26680905) +2154 train 7.202150 (lr=1.5766e-04) (hash(x)=23567808) +2155 train 7.422235 (lr=1.5764e-04) (hash(x)=26359528) +2156 train 7.226125 (lr=1.5763e-04) (hash(x)=23787652) +2157 train 7.495366 (lr=1.5761e-04) (hash(x)=28347177) +2158 train 7.213588 (lr=1.5760e-04) (hash(x)=25266519) +2159 train 7.121549 (lr=1.5758e-04) (hash(x)=25441262) +2160 train 7.030937 (lr=1.5757e-04) (hash(x)=23959943) +2161 train 7.293767 (lr=1.5755e-04) (hash(x)=27888093) +2162 train 7.166313 (lr=1.5754e-04) (hash(x)=25547833) +2163 train 7.129241 (lr=1.5752e-04) (hash(x)=24413659) +2164 train 8.585050 (lr=1.5750e-04) (hash(x)=34397626) +2165 train 7.103082 (lr=1.5749e-04) (hash(x)=21159323) +2166 train 7.285626 (lr=1.5747e-04) (hash(x)=25360269) +2167 train 7.324788 (lr=1.5746e-04) (hash(x)=29181867) +2168 train 7.132395 (lr=1.5744e-04) (hash(x)=22501613) +2169 train 7.217594 (lr=1.5743e-04) (hash(x)=26469077) +2170 train 7.142225 (lr=1.5741e-04) (hash(x)=26665118) +2171 train 7.838989 (lr=1.5739e-04) (hash(x)=31551575) +2172 train 7.093826 (lr=1.5738e-04) (hash(x)=24803935) +2173 train 6.979804 (lr=1.5736e-04) (hash(x)=20896465) +2174 train 7.454492 (lr=1.5735e-04) (hash(x)=25702284) +2175 train 7.468069 (lr=1.5733e-04) (hash(x)=27093757) +2176 train 7.239467 (lr=1.5732e-04) (hash(x)=26024255) +2177 train 7.443105 (lr=1.5730e-04) (hash(x)=26443521) +2178 train 7.337193 (lr=1.5729e-04) (hash(x)=25478467) +2179 train 7.211060 (lr=1.5727e-04) (hash(x)=23624298) +2180 train 7.316285 (lr=1.5725e-04) (hash(x)=27304178) +2181 train 7.086254 (lr=1.5724e-04) (hash(x)=23016570) +2182 train 7.084910 (lr=1.5722e-04) (hash(x)=21073756) +2183 train 7.164611 (lr=1.5721e-04) (hash(x)=25150275) +2184 train 6.930698 (lr=1.5719e-04) (hash(x)=21004187) +2185 train 7.195397 (lr=1.5718e-04) (hash(x)=25876062) +2186 train 7.141826 (lr=1.5716e-04) (hash(x)=24221275) +2187 train 7.433589 (lr=1.5714e-04) (hash(x)=26239886) +2188 train 7.137836 (lr=1.5713e-04) (hash(x)=23299261) +2189 train 7.585771 (lr=1.5711e-04) (hash(x)=31024703) +2190 train 7.698222 (lr=1.5710e-04) (hash(x)=30084774) +2191 train 7.973690 (lr=1.5708e-04) (hash(x)=33457102) +2192 train 7.139021 (lr=1.5707e-04) (hash(x)=22423723) +2193 train 7.197570 (lr=1.5705e-04) (hash(x)=21989055) +2194 train 7.202808 (lr=1.5703e-04) (hash(x)=23286499) +2195 train 7.134400 (lr=1.5702e-04) (hash(x)=17499738) +2196 train 7.202703 (lr=1.5700e-04) (hash(x)=25329557) +2197 train 7.077791 (lr=1.5699e-04) (hash(x)=24195578) +2198 train 7.341560 (lr=1.5697e-04) (hash(x)=26646383) +2199 train 7.218400 (lr=1.5696e-04) (hash(x)=25755322) +2200 val loss 7.2028 +2200 val perplexity 1343.1740 +2200 train 7.278682 (lr=1.5694e-04) (hash(x)=27592223) +2201 train 7.462245 (lr=1.5692e-04) (hash(x)=26164625) +2202 train 7.295854 (lr=1.5691e-04) (hash(x)=21856341) +2203 train 7.193582 (lr=1.5689e-04) (hash(x)=23722795) +2204 train 7.243820 (lr=1.5688e-04) (hash(x)=25409645) +2205 train 7.193689 (lr=1.5686e-04) (hash(x)=23415339) +2206 train 7.153795 (lr=1.5685e-04) (hash(x)=24147928) +2207 train 7.055360 (lr=1.5683e-04) (hash(x)=23630794) +2208 train 7.127914 (lr=1.5681e-04) (hash(x)=27361452) +2209 train 7.202175 (lr=1.5680e-04) (hash(x)=25632158) +2210 train 7.000299 (lr=1.5678e-04) (hash(x)=21159789) +2211 train 7.143888 (lr=1.5677e-04) (hash(x)=23374168) +2212 train 7.168916 (lr=1.5675e-04) (hash(x)=24844739) +2213 train 7.099088 (lr=1.5673e-04) (hash(x)=23461285) +2214 train 7.149236 (lr=1.5672e-04) (hash(x)=27958481) +2215 train 7.054107 (lr=1.5670e-04) (hash(x)=25167987) +2216 train 7.219252 (lr=1.5669e-04) (hash(x)=22873204) +2217 train 7.771296 (lr=1.5667e-04) (hash(x)=31038116) +2218 train 7.290943 (lr=1.5666e-04) (hash(x)=28883155) +2219 train 7.183564 (lr=1.5664e-04) (hash(x)=30941010) +2220 train 7.184251 (lr=1.5662e-04) (hash(x)=24947521) +2221 train 7.203125 (lr=1.5661e-04) (hash(x)=22703293) +2222 train 7.147859 (lr=1.5659e-04) (hash(x)=23976007) +2223 train 7.106090 (lr=1.5658e-04) (hash(x)=24043224) +2224 train 7.025371 (lr=1.5656e-04) (hash(x)=23981093) +2225 train 7.233047 (lr=1.5654e-04) (hash(x)=26445994) +2226 train 7.460978 (lr=1.5653e-04) (hash(x)=27252393) +2227 train 7.427547 (lr=1.5651e-04) (hash(x)=29736627) +2228 train 7.381726 (lr=1.5650e-04) (hash(x)=24698933) +2229 train 7.048856 (lr=1.5648e-04) (hash(x)=24357840) +2230 train 7.159691 (lr=1.5646e-04) (hash(x)=25384498) +2231 train 7.346642 (lr=1.5645e-04) (hash(x)=24665411) +2232 train 7.221428 (lr=1.5643e-04) (hash(x)=24646352) +2233 train 7.203944 (lr=1.5642e-04) (hash(x)=25670741) +2234 train 7.236210 (lr=1.5640e-04) (hash(x)=26648242) +2235 train 7.512154 (lr=1.5638e-04) (hash(x)=27916043) +2236 train 7.205905 (lr=1.5637e-04) (hash(x)=25963100) +2237 train 7.282026 (lr=1.5635e-04) (hash(x)=27357379) +2238 train 7.065588 (lr=1.5634e-04) (hash(x)=21852360) +2239 train 7.045384 (lr=1.5632e-04) (hash(x)=17321657) +2240 train 7.007039 (lr=1.5630e-04) (hash(x)=18446645) +2241 train 6.777542 (lr=1.5629e-04) (hash(x)=17550988) +2242 train 7.170926 (lr=1.5627e-04) (hash(x)=27052347) +2243 train 7.034857 (lr=1.5626e-04) (hash(x)=23829833) +2244 train 7.271704 (lr=1.5624e-04) (hash(x)=27267264) +2245 train 7.457403 (lr=1.5622e-04) (hash(x)=24673611) +2246 train 7.391397 (lr=1.5621e-04) (hash(x)=25248507) +2247 train 7.658443 (lr=1.5619e-04) (hash(x)=27932591) +2248 train 7.502725 (lr=1.5618e-04) (hash(x)=26078877) +2249 train 7.513823 (lr=1.5616e-04) (hash(x)=26067367) +2250 val loss 7.2082 +2250 val perplexity 1350.4000 +2250 train 7.552484 (lr=1.5614e-04) (hash(x)=29143527) +2251 train 7.489226 (lr=1.5613e-04) (hash(x)=28206079) +2252 train 8.031937 (lr=1.5611e-04) (hash(x)=28894494) +2253 train 7.600426 (lr=1.5610e-04) (hash(x)=27977422) +2254 train 7.253788 (lr=1.5608e-04) (hash(x)=26446420) +2255 train 7.401930 (lr=1.5606e-04) (hash(x)=29447954) +2256 train 7.323130 (lr=1.5605e-04) (hash(x)=22181789) +2257 train 7.258037 (lr=1.5603e-04) (hash(x)=24976337) +2258 train 7.238463 (lr=1.5602e-04) (hash(x)=23277532) +2259 train 7.349601 (lr=1.5600e-04) (hash(x)=25935364) +2260 train 7.511430 (lr=1.5598e-04) (hash(x)=26988889) +2261 train 7.259310 (lr=1.5597e-04) (hash(x)=26887303) +2262 train 7.256271 (lr=1.5595e-04) (hash(x)=25021426) +2263 train 7.195648 (lr=1.5594e-04) (hash(x)=24621816) +2264 train 7.053729 (lr=1.5592e-04) (hash(x)=22132007) +2265 train 7.021738 (lr=1.5590e-04) (hash(x)=22648602) +2266 train 7.299330 (lr=1.5589e-04) (hash(x)=23132242) +2267 train 7.338404 (lr=1.5587e-04) (hash(x)=24070405) +2268 train 6.945098 (lr=1.5585e-04) (hash(x)=21412906) +2269 train 7.640935 (lr=1.5584e-04) (hash(x)=27547292) +2270 train 7.407146 (lr=1.5582e-04) (hash(x)=27740500) +2271 train 7.121562 (lr=1.5581e-04) (hash(x)=24682294) +2272 train 7.520644 (lr=1.5579e-04) (hash(x)=27969424) +2273 train 7.240215 (lr=1.5577e-04) (hash(x)=22172182) +2274 train 7.225128 (lr=1.5576e-04) (hash(x)=26485905) +2275 train 7.073462 (lr=1.5574e-04) (hash(x)=24050209) +2276 train 7.253841 (lr=1.5572e-04) (hash(x)=28802650) +2277 train 7.022732 (lr=1.5571e-04) (hash(x)=23644616) +2278 train 7.194449 (lr=1.5569e-04) (hash(x)=25409768) +2279 train 7.385458 (lr=1.5568e-04) (hash(x)=28057095) +2280 train 7.827838 (lr=1.5566e-04) (hash(x)=31689723) +2281 train 7.073909 (lr=1.5564e-04) (hash(x)=22252427) +2282 train 7.295732 (lr=1.5563e-04) (hash(x)=24142092) +2283 train 7.279134 (lr=1.5561e-04) (hash(x)=22523232) +2284 train 7.451455 (lr=1.5559e-04) (hash(x)=26017294) +2285 train 7.275864 (lr=1.5558e-04) (hash(x)=25025388) +2286 train 7.036748 (lr=1.5556e-04) (hash(x)=23819479) +2287 train 7.212591 (lr=1.5555e-04) (hash(x)=24547536) +2288 train 6.995848 (lr=1.5553e-04) (hash(x)=22622789) +2289 train 6.978000 (lr=1.5551e-04) (hash(x)=23874051) +2290 train 7.322127 (lr=1.5550e-04) (hash(x)=25015641) +2291 train 7.194492 (lr=1.5548e-04) (hash(x)=24978712) +2292 train 7.267041 (lr=1.5546e-04) (hash(x)=25311986) +2293 train 7.014516 (lr=1.5545e-04) (hash(x)=24298295) +2294 train 7.125968 (lr=1.5543e-04) (hash(x)=26481527) +2295 train 6.856767 (lr=1.5542e-04) (hash(x)=18987545) +2296 train 7.098308 (lr=1.5540e-04) (hash(x)=24617990) +2297 train 7.105203 (lr=1.5538e-04) (hash(x)=23903200) +2298 train 7.422249 (lr=1.5537e-04) (hash(x)=26278697) +2299 train 7.191295 (lr=1.5535e-04) (hash(x)=24092784) +2300 val loss 7.2140 +2300 val perplexity 1358.3629 +2300 train 7.128455 (lr=1.5533e-04) (hash(x)=22894919) +2301 train 7.207037 (lr=1.5532e-04) (hash(x)=24253964) +2302 train 7.170662 (lr=1.5530e-04) (hash(x)=23750610) +2303 train 7.179933 (lr=1.5528e-04) (hash(x)=26745063) +2304 train 6.975064 (lr=1.5527e-04) (hash(x)=21407001) +2305 train 7.386869 (lr=1.5525e-04) (hash(x)=26680082) +2306 train 7.290962 (lr=1.5524e-04) (hash(x)=26722122) +2307 train 7.116031 (lr=1.5522e-04) (hash(x)=22539112) +2308 train 6.956487 (lr=1.5520e-04) (hash(x)=19927356) +2309 train 7.006226 (lr=1.5519e-04) (hash(x)=21431267) +2310 train 6.953877 (lr=1.5517e-04) (hash(x)=21073487) +2311 train 6.970673 (lr=1.5515e-04) (hash(x)=21447406) +2312 train 6.947327 (lr=1.5514e-04) (hash(x)=22667253) +2313 train 6.915190 (lr=1.5512e-04) (hash(x)=20849089) +2314 train 6.893802 (lr=1.5510e-04) (hash(x)=19168351) +2315 train 6.928136 (lr=1.5509e-04) (hash(x)=21082139) +2316 train 6.900626 (lr=1.5507e-04) (hash(x)=21493530) +2317 train 6.837878 (lr=1.5505e-04) (hash(x)=19506447) +2318 train 6.974903 (lr=1.5504e-04) (hash(x)=23128797) +2319 train 7.085539 (lr=1.5502e-04) (hash(x)=24650655) +2320 train 6.828388 (lr=1.5501e-04) (hash(x)=21833080) +2321 train 7.394781 (lr=1.5499e-04) (hash(x)=26355512) +2322 train 7.557436 (lr=1.5497e-04) (hash(x)=26746363) +2323 train 6.980466 (lr=1.5496e-04) (hash(x)=22130721) +2324 train 7.369169 (lr=1.5494e-04) (hash(x)=28301752) +2325 train 7.190547 (lr=1.5492e-04) (hash(x)=26444359) +2326 train 7.559658 (lr=1.5491e-04) (hash(x)=24836130) +2327 train 7.957790 (lr=1.5489e-04) (hash(x)=26519976) +2328 train 9.313456 (lr=1.5487e-04) (hash(x)=35558906) +2329 train 7.600545 (lr=1.5486e-04) (hash(x)=30877729) +2330 train 7.497347 (lr=1.5484e-04) (hash(x)=28028485) +2331 train 7.616766 (lr=1.5482e-04) (hash(x)=25582440) +2332 train 7.904592 (lr=1.5481e-04) (hash(x)=29402491) +2333 train 7.202252 (lr=1.5479e-04) (hash(x)=25200284) +2334 train 7.181588 (lr=1.5477e-04) (hash(x)=26288480) +2335 train 6.917838 (lr=1.5476e-04) (hash(x)=20106514) +2336 train 6.946895 (lr=1.5474e-04) (hash(x)=22522123) +2337 train 6.969606 (lr=1.5472e-04) (hash(x)=23362041) +2338 train 7.132684 (lr=1.5471e-04) (hash(x)=26003099) +2339 train 7.160518 (lr=1.5469e-04) (hash(x)=25695510) +2340 train 7.158007 (lr=1.5467e-04) (hash(x)=27225904) +2341 train 6.871559 (lr=1.5466e-04) (hash(x)=21573008) +2342 train 7.296378 (lr=1.5464e-04) (hash(x)=21386628) +2343 train 7.085287 (lr=1.5463e-04) (hash(x)=20117808) +2344 train 7.206694 (lr=1.5461e-04) (hash(x)=21592790) +2345 train 7.093896 (lr=1.5459e-04) (hash(x)=19909192) +2346 train 7.326715 (lr=1.5458e-04) (hash(x)=22529262) +2347 train 7.336053 (lr=1.5456e-04) (hash(x)=24501900) +2348 train 7.106239 (lr=1.5454e-04) (hash(x)=25912171) +2349 train 7.211457 (lr=1.5453e-04) (hash(x)=25606665) +2350 val loss 7.1720 +2350 val perplexity 1302.4860 +2350 train 7.126236 (lr=1.5451e-04) (hash(x)=24487351) +2351 train 7.390485 (lr=1.5449e-04) (hash(x)=25510334) +2352 train 7.295879 (lr=1.5448e-04) (hash(x)=25357989) +2353 train 6.926370 (lr=1.5446e-04) (hash(x)=24656801) +2354 train 7.005455 (lr=1.5444e-04) (hash(x)=23312772) +2355 train 6.877117 (lr=1.5443e-04) (hash(x)=22099158) +2356 train 6.938352 (lr=1.5441e-04) (hash(x)=26507898) +2357 train 7.249841 (lr=1.5439e-04) (hash(x)=28351614) +2358 train 7.242980 (lr=1.5438e-04) (hash(x)=27489567) +2359 train 7.265566 (lr=1.5436e-04) (hash(x)=25749120) +2360 train 7.591507 (lr=1.5434e-04) (hash(x)=31711338) +2361 train 7.732987 (lr=1.5433e-04) (hash(x)=29645018) +2362 train 7.681409 (lr=1.5431e-04) (hash(x)=29713268) +2363 train 6.852782 (lr=1.5429e-04) (hash(x)=21720691) +2364 train 6.976736 (lr=1.5428e-04) (hash(x)=24316633) +2365 train 6.909447 (lr=1.5426e-04) (hash(x)=21597124) +2366 train 6.932871 (lr=1.5424e-04) (hash(x)=22520345) +2367 train 6.976645 (lr=1.5422e-04) (hash(x)=24357241) +2368 train 7.104248 (lr=1.5421e-04) (hash(x)=24085450) +2369 train 7.047561 (lr=1.5419e-04) (hash(x)=25136495) +2370 train 7.549646 (lr=1.5417e-04) (hash(x)=26073986) +2371 train 7.469612 (lr=1.5416e-04) (hash(x)=28911272) +2372 train 7.266843 (lr=1.5414e-04) (hash(x)=26667356) +2373 train 7.084615 (lr=1.5412e-04) (hash(x)=25225894) +2374 train 7.122240 (lr=1.5411e-04) (hash(x)=24404081) +2375 train 7.208936 (lr=1.5409e-04) (hash(x)=25584945) +2376 train 7.023982 (lr=1.5407e-04) (hash(x)=23831571) +2377 train 7.023773 (lr=1.5406e-04) (hash(x)=23521916) +2378 train 7.035966 (lr=1.5404e-04) (hash(x)=25318634) +2379 train 6.875671 (lr=1.5402e-04) (hash(x)=21847287) +2380 train 7.276779 (lr=1.5401e-04) (hash(x)=23877060) +2381 train 7.050318 (lr=1.5399e-04) (hash(x)=24069020) +2382 train 6.822395 (lr=1.5397e-04) (hash(x)=21724290) +2383 train 7.122444 (lr=1.5396e-04) (hash(x)=25198897) +2384 train 6.985084 (lr=1.5394e-04) (hash(x)=24109958) +2385 train 6.857788 (lr=1.5392e-04) (hash(x)=20122390) +2386 train 7.105152 (lr=1.5391e-04) (hash(x)=24062305) +2387 train 6.891525 (lr=1.5389e-04) (hash(x)=22436833) +2388 train 7.216661 (lr=1.5387e-04) (hash(x)=26013214) +2389 train 7.597881 (lr=1.5386e-04) (hash(x)=27691436) +2390 train 7.718685 (lr=1.5384e-04) (hash(x)=30802878) +2391 train 6.848949 (lr=1.5382e-04) (hash(x)=23475891) +2392 train 6.867284 (lr=1.5380e-04) (hash(x)=23118133) +2393 train 6.763780 (lr=1.5379e-04) (hash(x)=21469159) +2394 train 7.128213 (lr=1.5377e-04) (hash(x)=26444484) +2395 train 6.993059 (lr=1.5375e-04) (hash(x)=25083992) +2396 train 7.311016 (lr=1.5374e-04) (hash(x)=23461229) +2397 train 7.147075 (lr=1.5372e-04) (hash(x)=20441653) +2398 train 7.273702 (lr=1.5370e-04) (hash(x)=28024211) +2399 train 7.135667 (lr=1.5369e-04) (hash(x)=23644804) +2400 val loss 7.1537 +2400 val perplexity 1278.7708 +2400 train 6.913914 (lr=1.5367e-04) (hash(x)=26685301) +2401 train 6.762498 (lr=1.5365e-04) (hash(x)=20820913) +2402 train 6.944477 (lr=1.5364e-04) (hash(x)=22178190) +2403 train 7.589761 (lr=1.5362e-04) (hash(x)=31377168) +2404 train 7.793725 (lr=1.5360e-04) (hash(x)=33795307) +2405 train 7.961916 (lr=1.5358e-04) (hash(x)=34450341) +2406 train 7.091927 (lr=1.5357e-04) (hash(x)=25834183) +2407 train 7.324767 (lr=1.5355e-04) (hash(x)=25629584) +2408 train 7.077832 (lr=1.5353e-04) (hash(x)=25080123) +2409 train 6.950243 (lr=1.5352e-04) (hash(x)=21975628) +2410 train 7.540851 (lr=1.5350e-04) (hash(x)=27430197) +2411 train 7.677673 (lr=1.5348e-04) (hash(x)=29285135) +2412 train 7.333495 (lr=1.5347e-04) (hash(x)=24640105) +2413 train 7.528357 (lr=1.5345e-04) (hash(x)=29628864) +2414 train 7.728819 (lr=1.5343e-04) (hash(x)=30096444) +2415 train 7.485021 (lr=1.5341e-04) (hash(x)=29797280) +2416 train 6.904132 (lr=1.5340e-04) (hash(x)=22686143) +2417 train 7.506909 (lr=1.5338e-04) (hash(x)=28346842) +2418 train 7.465044 (lr=1.5336e-04) (hash(x)=28167937) +2419 train 7.686949 (lr=1.5335e-04) (hash(x)=33122326) +2420 train 7.711362 (lr=1.5333e-04) (hash(x)=33044913) +2421 train 7.497859 (lr=1.5331e-04) (hash(x)=31250981) +2422 train 7.734761 (lr=1.5330e-04) (hash(x)=29827111) +2423 train 7.648401 (lr=1.5328e-04) (hash(x)=30026394) +2424 train 7.769916 (lr=1.5326e-04) (hash(x)=26998238) +2425 train 7.743581 (lr=1.5324e-04) (hash(x)=24850684) +2426 train 7.922364 (lr=1.5323e-04) (hash(x)=36659853) +2427 train 7.840289 (lr=1.5321e-04) (hash(x)=34353164) +2428 train 7.149171 (lr=1.5319e-04) (hash(x)=23630644) +2429 train 7.126768 (lr=1.5318e-04) (hash(x)=24528186) +2430 train 6.989317 (lr=1.5316e-04) (hash(x)=22665222) +2431 train 7.140877 (lr=1.5314e-04) (hash(x)=26594177) +2432 train 7.512106 (lr=1.5312e-04) (hash(x)=29300546) +2433 train 6.890776 (lr=1.5311e-04) (hash(x)=21331715) +2434 train 7.225826 (lr=1.5309e-04) (hash(x)=26290885) +2435 train 7.149232 (lr=1.5307e-04) (hash(x)=25554738) +2436 train 7.443042 (lr=1.5306e-04) (hash(x)=26744311) +2437 train 7.351711 (lr=1.5304e-04) (hash(x)=26872344) +2438 train 7.448213 (lr=1.5302e-04) (hash(x)=27636081) +2439 train 7.184001 (lr=1.5300e-04) (hash(x)=23766256) +2440 train 7.303865 (lr=1.5299e-04) (hash(x)=24434438) +2441 train 7.095018 (lr=1.5297e-04) (hash(x)=22992618) +2442 train 6.943678 (lr=1.5295e-04) (hash(x)=22393467) +2443 train 7.256218 (lr=1.5294e-04) (hash(x)=26853444) +2444 train 7.158194 (lr=1.5292e-04) (hash(x)=25101020) +2445 train 7.053073 (lr=1.5290e-04) (hash(x)=24705456) +2446 train 7.377835 (lr=1.5288e-04) (hash(x)=26798611) +2447 train 7.034023 (lr=1.5287e-04) (hash(x)=24250150) +2448 train 7.106258 (lr=1.5285e-04) (hash(x)=24494331) +2449 train 7.135391 (lr=1.5283e-04) (hash(x)=27579257) +2450 val loss 7.1611 +2450 val perplexity 1288.3290 +2450 train 6.862149 (lr=1.5282e-04) (hash(x)=22377407) +2451 train 7.174086 (lr=1.5280e-04) (hash(x)=26289588) +2452 train 7.110649 (lr=1.5278e-04) (hash(x)=25871900) +2453 train 7.003104 (lr=1.5276e-04) (hash(x)=23437197) +2454 train 7.268243 (lr=1.5275e-04) (hash(x)=23557786) +2455 train 7.181674 (lr=1.5273e-04) (hash(x)=26108817) +2456 train 7.078134 (lr=1.5271e-04) (hash(x)=26440482) +2457 train 7.073737 (lr=1.5269e-04) (hash(x)=24583191) +2458 train 7.076431 (lr=1.5268e-04) (hash(x)=23756440) +2459 train 6.940659 (lr=1.5266e-04) (hash(x)=23814987) +2460 train 7.364027 (lr=1.5264e-04) (hash(x)=28508433) +2461 train 6.952703 (lr=1.5263e-04) (hash(x)=25692442) +2462 train 6.930717 (lr=1.5261e-04) (hash(x)=24699197) +2463 train 6.624103 (lr=1.5259e-04) (hash(x)=18582688) +2464 train 6.969110 (lr=1.5257e-04) (hash(x)=23266625) +2465 train 7.318349 (lr=1.5256e-04) (hash(x)=26565489) +2466 train 6.802972 (lr=1.5254e-04) (hash(x)=21686599) +2467 train 7.090028 (lr=1.5252e-04) (hash(x)=25558792) +2468 train 6.841968 (lr=1.5250e-04) (hash(x)=25110035) +2469 train 7.230238 (lr=1.5249e-04) (hash(x)=26263661) +2470 train 6.949924 (lr=1.5247e-04) (hash(x)=22282189) +2471 train 6.938351 (lr=1.5245e-04) (hash(x)=23272705) +2472 train 7.064044 (lr=1.5244e-04) (hash(x)=25300067) +2473 train 7.224979 (lr=1.5242e-04) (hash(x)=26802369) +2474 train 6.916575 (lr=1.5240e-04) (hash(x)=24646471) +2475 train 6.901668 (lr=1.5238e-04) (hash(x)=24709241) +2476 train 6.984997 (lr=1.5237e-04) (hash(x)=26747197) +2477 train 7.037914 (lr=1.5235e-04) (hash(x)=25201108) +2478 train 7.150245 (lr=1.5233e-04) (hash(x)=24962427) +2479 train 6.991340 (lr=1.5231e-04) (hash(x)=24793412) +2480 train 7.063765 (lr=1.5230e-04) (hash(x)=24452301) +2481 train 7.073445 (lr=1.5228e-04) (hash(x)=25177251) +2482 train 6.986265 (lr=1.5226e-04) (hash(x)=25801499) +2483 train 7.165100 (lr=1.5224e-04) (hash(x)=27256707) +2484 train 7.440734 (lr=1.5223e-04) (hash(x)=25303237) +2485 train 7.026193 (lr=1.5221e-04) (hash(x)=21641481) +2486 train 6.969122 (lr=1.5219e-04) (hash(x)=23818831) +2487 train 6.755911 (lr=1.5217e-04) (hash(x)=19280989) +2488 train 7.118567 (lr=1.5216e-04) (hash(x)=24075167) +2489 train 7.100576 (lr=1.5214e-04) (hash(x)=26651546) +2490 train 7.065365 (lr=1.5212e-04) (hash(x)=25367186) +2491 train 7.009181 (lr=1.5210e-04) (hash(x)=26508642) +2492 train 7.125318 (lr=1.5209e-04) (hash(x)=25294182) +2493 train 7.010205 (lr=1.5207e-04) (hash(x)=23916886) +2494 train 6.874182 (lr=1.5205e-04) (hash(x)=21189910) +2495 train 7.004101 (lr=1.5204e-04) (hash(x)=22751150) +2496 train 7.432870 (lr=1.5202e-04) (hash(x)=26608502) +2497 train 7.856473 (lr=1.5200e-04) (hash(x)=25372010) +2498 train 7.056932 (lr=1.5198e-04) (hash(x)=22006251) +2499 train 7.011755 (lr=1.5197e-04) (hash(x)=23880160) +2500 val loss 7.1469 +2500 val perplexity 1270.1656 +2500 train 6.930294 (lr=1.5195e-04) (hash(x)=23225337) +2501 train 7.126791 (lr=1.5193e-04) (hash(x)=24932950) +2502 train 6.835002 (lr=1.5191e-04) (hash(x)=20022340) +2503 train 7.243299 (lr=1.5190e-04) (hash(x)=23537942) +2504 train 7.119513 (lr=1.5188e-04) (hash(x)=24884288) +2505 train 6.738880 (lr=1.5186e-04) (hash(x)=21296580) +2506 train 6.987743 (lr=1.5184e-04) (hash(x)=23001455) +2507 train 7.304556 (lr=1.5183e-04) (hash(x)=26975313) +2508 train 7.292010 (lr=1.5181e-04) (hash(x)=26029962) +2509 train 6.986679 (lr=1.5179e-04) (hash(x)=24302204) +2510 train 6.707054 (lr=1.5177e-04) (hash(x)=22997203) +2511 train 6.817518 (lr=1.5176e-04) (hash(x)=23748375) +2512 train 7.074475 (lr=1.5174e-04) (hash(x)=24453191) +2513 train 6.730492 (lr=1.5172e-04) (hash(x)=22026776) +2514 train 6.824657 (lr=1.5170e-04) (hash(x)=19934168) +2515 train 7.155850 (lr=1.5168e-04) (hash(x)=25541754) +2516 train 7.544952 (lr=1.5167e-04) (hash(x)=26604471) +2517 train 7.504477 (lr=1.5165e-04) (hash(x)=27900386) +2518 train 7.476610 (lr=1.5163e-04) (hash(x)=26403431) +2519 train 7.495322 (lr=1.5161e-04) (hash(x)=27413825) +2520 train 7.560063 (lr=1.5160e-04) (hash(x)=28332637) +2521 train 7.344283 (lr=1.5158e-04) (hash(x)=27223027) +2522 train 7.364841 (lr=1.5156e-04) (hash(x)=23843387) +2523 train 7.403606 (lr=1.5154e-04) (hash(x)=27075951) +2524 train 7.596626 (lr=1.5153e-04) (hash(x)=29300154) +2525 train 7.226836 (lr=1.5151e-04) (hash(x)=28100582) +2526 train 7.300175 (lr=1.5149e-04) (hash(x)=28051084) +2527 train 7.025070 (lr=1.5147e-04) (hash(x)=21682445) +2528 train 7.213558 (lr=1.5146e-04) (hash(x)=24062589) +2529 train 7.399007 (lr=1.5144e-04) (hash(x)=29616079) +2530 train 7.293129 (lr=1.5142e-04) (hash(x)=25170523) +2531 train 6.875052 (lr=1.5140e-04) (hash(x)=23361504) +2532 train 7.092671 (lr=1.5139e-04) (hash(x)=24444462) +2533 train 7.108704 (lr=1.5137e-04) (hash(x)=24035993) +2534 train 7.040284 (lr=1.5135e-04) (hash(x)=24696651) +2535 train 7.046281 (lr=1.5133e-04) (hash(x)=22040184) +2536 train 6.930234 (lr=1.5131e-04) (hash(x)=27400103) +2537 train 7.276354 (lr=1.5130e-04) (hash(x)=27383080) +2538 train 7.061976 (lr=1.5128e-04) (hash(x)=24212212) +2539 train 6.950451 (lr=1.5126e-04) (hash(x)=23727731) +2540 train 7.082475 (lr=1.5124e-04) (hash(x)=24149487) +2541 train 6.831481 (lr=1.5123e-04) (hash(x)=23794649) +2542 train 7.018198 (lr=1.5121e-04) (hash(x)=26147774) +2543 train 7.131169 (lr=1.5119e-04) (hash(x)=24463229) +2544 train 7.221761 (lr=1.5117e-04) (hash(x)=26361238) +2545 train 6.858536 (lr=1.5116e-04) (hash(x)=18891545) +2546 train 7.403035 (lr=1.5114e-04) (hash(x)=30380438) +2547 train 7.635149 (lr=1.5112e-04) (hash(x)=32663792) +2548 train 7.028577 (lr=1.5110e-04) (hash(x)=25175499) +2549 train 7.227487 (lr=1.5108e-04) (hash(x)=26702407) +2550 val loss 7.1136 +2550 val perplexity 1228.5533 +2550 train 7.053188 (lr=1.5107e-04) (hash(x)=24578061) +2551 train 7.065149 (lr=1.5105e-04) (hash(x)=24091954) +2552 train 7.090393 (lr=1.5103e-04) (hash(x)=23041778) +2553 train 6.840335 (lr=1.5101e-04) (hash(x)=23686239) +2554 train 6.973256 (lr=1.5100e-04) (hash(x)=22745355) +2555 train 7.044753 (lr=1.5098e-04) (hash(x)=23599013) +2556 train 6.951663 (lr=1.5096e-04) (hash(x)=26033088) +2557 train 7.055416 (lr=1.5094e-04) (hash(x)=21634218) +2558 train 6.930358 (lr=1.5092e-04) (hash(x)=20985281) +2559 train 7.220418 (lr=1.5091e-04) (hash(x)=26670219) +2560 train 6.984647 (lr=1.5089e-04) (hash(x)=26499936) +2561 train 7.076793 (lr=1.5087e-04) (hash(x)=23547908) +2562 train 6.934162 (lr=1.5085e-04) (hash(x)=22306373) +2563 train 7.069060 (lr=1.5083e-04) (hash(x)=24380893) +2564 train 6.977830 (lr=1.5082e-04) (hash(x)=23726190) +2565 train 7.029648 (lr=1.5080e-04) (hash(x)=26967512) +2566 train 7.128834 (lr=1.5078e-04) (hash(x)=23414576) +2567 train 7.356732 (lr=1.5076e-04) (hash(x)=25558986) +2568 train 7.234155 (lr=1.5075e-04) (hash(x)=27057505) +2569 train 7.230144 (lr=1.5073e-04) (hash(x)=26048135) +2570 train 7.179449 (lr=1.5071e-04) (hash(x)=26991032) +2571 train 7.210098 (lr=1.5069e-04) (hash(x)=25729492) +2572 train 6.752546 (lr=1.5067e-04) (hash(x)=20611723) +2573 train 6.889413 (lr=1.5066e-04) (hash(x)=24563606) +2574 train 6.975897 (lr=1.5064e-04) (hash(x)=23330043) +2575 train 6.975950 (lr=1.5062e-04) (hash(x)=19218943) +2576 train 7.356973 (lr=1.5060e-04) (hash(x)=20985122) +2577 train 6.966020 (lr=1.5058e-04) (hash(x)=24133609) +2578 train 7.330724 (lr=1.5057e-04) (hash(x)=28368610) +2579 train 7.007539 (lr=1.5055e-04) (hash(x)=23952206) +2580 train 6.906406 (lr=1.5053e-04) (hash(x)=23068957) +2581 train 7.037670 (lr=1.5051e-04) (hash(x)=25365277) +2582 train 7.380593 (lr=1.5050e-04) (hash(x)=24721184) +2583 train 7.075549 (lr=1.5048e-04) (hash(x)=24551402) +2584 train 6.786424 (lr=1.5046e-04) (hash(x)=20469327) +2585 train 7.241405 (lr=1.5044e-04) (hash(x)=24966478) +2586 train 6.954514 (lr=1.5042e-04) (hash(x)=18626184) +2587 train 6.966046 (lr=1.5041e-04) (hash(x)=24007642) +2588 train 6.946880 (lr=1.5039e-04) (hash(x)=23521875) +2589 train 7.175200 (lr=1.5037e-04) (hash(x)=25204207) +2590 train 6.906598 (lr=1.5035e-04) (hash(x)=25449801) +2591 train 7.141023 (lr=1.5033e-04) (hash(x)=25229281) +2592 train 6.986961 (lr=1.5032e-04) (hash(x)=23202696) +2593 train 6.805685 (lr=1.5030e-04) (hash(x)=22435944) +2594 train 6.888866 (lr=1.5028e-04) (hash(x)=20787439) +2595 train 6.379148 (lr=1.5026e-04) (hash(x)=18214283) +2596 train 6.603778 (lr=1.5024e-04) (hash(x)=20851477) +2597 train 6.598873 (lr=1.5023e-04) (hash(x)=20609675) +2598 train 6.719247 (lr=1.5021e-04) (hash(x)=20061218) +2599 train 6.773364 (lr=1.5019e-04) (hash(x)=21251127) +2600 val loss 7.1030 +2600 val perplexity 1215.5907 +2600 train 7.305202 (lr=1.5017e-04) (hash(x)=30948038) +2601 train 7.573461 (lr=1.5015e-04) (hash(x)=32279160) +2602 train 7.192358 (lr=1.5014e-04) (hash(x)=26607151) +2603 train 7.081352 (lr=1.5012e-04) (hash(x)=25097619) +2604 train 6.639290 (lr=1.5010e-04) (hash(x)=20892421) +2605 train 6.823328 (lr=1.5008e-04) (hash(x)=22212821) +2606 train 7.144189 (lr=1.5006e-04) (hash(x)=24720588) +2607 train 7.138312 (lr=1.5005e-04) (hash(x)=25800857) +2608 train 6.948888 (lr=1.5003e-04) (hash(x)=22901279) +2609 train 6.806049 (lr=1.5001e-04) (hash(x)=20921910) +2610 train 7.074687 (lr=1.4999e-04) (hash(x)=24846267) +2611 train 6.956853 (lr=1.4997e-04) (hash(x)=22918428) +2612 train 6.877678 (lr=1.4995e-04) (hash(x)=22805901) +2613 train 7.047461 (lr=1.4994e-04) (hash(x)=24345816) +2614 train 6.885321 (lr=1.4992e-04) (hash(x)=22962012) +2615 train 7.163484 (lr=1.4990e-04) (hash(x)=25836189) +2616 train 7.214571 (lr=1.4988e-04) (hash(x)=27922916) +2617 train 6.899690 (lr=1.4986e-04) (hash(x)=21697866) +2618 train 6.930212 (lr=1.4985e-04) (hash(x)=24283369) +2619 train 6.824643 (lr=1.4983e-04) (hash(x)=24504567) +2620 train 6.945812 (lr=1.4981e-04) (hash(x)=25557725) +2621 train 6.989742 (lr=1.4979e-04) (hash(x)=23135849) +2622 train 6.922322 (lr=1.4977e-04) (hash(x)=22888908) +2623 train 7.125389 (lr=1.4976e-04) (hash(x)=25999255) +2624 train 6.997188 (lr=1.4974e-04) (hash(x)=24446851) +2625 train 6.714858 (lr=1.4972e-04) (hash(x)=21137520) +2626 train 7.030676 (lr=1.4970e-04) (hash(x)=26245754) +2627 train 7.399109 (lr=1.4968e-04) (hash(x)=27308968) +2628 train 7.120383 (lr=1.4966e-04) (hash(x)=23961169) +2629 train 7.062837 (lr=1.4965e-04) (hash(x)=25924731) +2630 train 7.138581 (lr=1.4963e-04) (hash(x)=25782315) +2631 train 7.185484 (lr=1.4961e-04) (hash(x)=20149394) +2632 train 7.291530 (lr=1.4959e-04) (hash(x)=23801981) +2633 train 7.028949 (lr=1.4957e-04) (hash(x)=23830286) +2634 train 6.974342 (lr=1.4956e-04) (hash(x)=25325236) +2635 train 6.963615 (lr=1.4954e-04) (hash(x)=24498556) +2636 train 6.913893 (lr=1.4952e-04) (hash(x)=23693078) +2637 train 7.108800 (lr=1.4950e-04) (hash(x)=25484922) +2638 train 6.754720 (lr=1.4948e-04) (hash(x)=22645025) +2639 train 6.734554 (lr=1.4946e-04) (hash(x)=21999338) +2640 train 7.003512 (lr=1.4945e-04) (hash(x)=21758019) +2641 train 6.930909 (lr=1.4943e-04) (hash(x)=24064168) +2642 train 6.954285 (lr=1.4941e-04) (hash(x)=26847292) +2643 train 6.816876 (lr=1.4939e-04) (hash(x)=23280568) +2644 train 6.833010 (lr=1.4937e-04) (hash(x)=21749161) +2645 train 7.450410 (lr=1.4935e-04) (hash(x)=30082352) +2646 train 7.323532 (lr=1.4934e-04) (hash(x)=28334297) +2647 train 7.484505 (lr=1.4932e-04) (hash(x)=27611302) +2648 train 7.907628 (lr=1.4930e-04) (hash(x)=31007436) +2649 train 6.766875 (lr=1.4928e-04) (hash(x)=22356183) +2650 val loss 7.1348 +2650 val perplexity 1254.8794 +2650 train 6.854495 (lr=1.4926e-04) (hash(x)=23071731) +2651 train 6.857643 (lr=1.4924e-04) (hash(x)=23982308) +2652 train 7.187992 (lr=1.4923e-04) (hash(x)=25673823) +2653 train 6.948227 (lr=1.4921e-04) (hash(x)=22973788) +2654 train 7.116024 (lr=1.4919e-04) (hash(x)=25386647) +2655 train 6.802705 (lr=1.4917e-04) (hash(x)=22778356) +2656 train 7.115211 (lr=1.4915e-04) (hash(x)=26669130) +2657 train 6.769322 (lr=1.4913e-04) (hash(x)=23542930) +2658 train 6.929723 (lr=1.4912e-04) (hash(x)=23307871) +2659 train 6.861690 (lr=1.4910e-04) (hash(x)=23467046) +2660 train 7.049831 (lr=1.4908e-04) (hash(x)=24728872) +2661 train 7.712663 (lr=1.4906e-04) (hash(x)=29719902) +2662 train 6.959905 (lr=1.4904e-04) (hash(x)=25114165) +2663 train 6.911148 (lr=1.4902e-04) (hash(x)=24195959) +2664 train 7.109231 (lr=1.4901e-04) (hash(x)=26938509) +2665 train 7.275647 (lr=1.4899e-04) (hash(x)=27168434) +2666 train 7.426726 (lr=1.4897e-04) (hash(x)=27488221) +2667 train 8.110686 (lr=1.4895e-04) (hash(x)=32710438) +2668 train 7.218362 (lr=1.4893e-04) (hash(x)=25073185) +2669 train 7.209074 (lr=1.4891e-04) (hash(x)=26951664) +2670 train 7.392302 (lr=1.4890e-04) (hash(x)=24886228) +2671 train 6.771410 (lr=1.4888e-04) (hash(x)=19127465) +2672 train 7.121171 (lr=1.4886e-04) (hash(x)=27134917) +2673 train 7.037853 (lr=1.4884e-04) (hash(x)=25673955) +2674 train 7.577124 (lr=1.4882e-04) (hash(x)=27111776) +2675 train 7.562141 (lr=1.4880e-04) (hash(x)=28962580) +2676 train 7.074997 (lr=1.4879e-04) (hash(x)=25593381) +2677 train 7.123169 (lr=1.4877e-04) (hash(x)=25238916) +2678 train 6.922254 (lr=1.4875e-04) (hash(x)=27453574) +2679 train 6.935172 (lr=1.4873e-04) (hash(x)=22426274) +2680 train 6.990572 (lr=1.4871e-04) (hash(x)=22974780) +2681 train 7.024533 (lr=1.4869e-04) (hash(x)=24668644) +2682 train 7.044163 (lr=1.4868e-04) (hash(x)=26182084) +2683 train 7.189498 (lr=1.4866e-04) (hash(x)=25606512) +2684 train 7.035353 (lr=1.4864e-04) (hash(x)=24885252) +2685 train 6.841277 (lr=1.4862e-04) (hash(x)=21290254) +2686 train 6.755980 (lr=1.4860e-04) (hash(x)=21367078) +2687 train 6.938178 (lr=1.4858e-04) (hash(x)=23785205) +2688 train 6.846581 (lr=1.4856e-04) (hash(x)=24640056) +2689 train 7.324646 (lr=1.4855e-04) (hash(x)=27083886) +2690 train 6.984239 (lr=1.4853e-04) (hash(x)=23603571) +2691 train 7.060028 (lr=1.4851e-04) (hash(x)=24779414) +2692 train 6.734327 (lr=1.4849e-04) (hash(x)=22200693) +2693 train 7.149426 (lr=1.4847e-04) (hash(x)=26907868) +2694 train 7.447612 (lr=1.4845e-04) (hash(x)=32034827) +2695 train 7.349157 (lr=1.4843e-04) (hash(x)=28505676) +2696 train 6.913701 (lr=1.4842e-04) (hash(x)=23805750) +2697 train 7.252342 (lr=1.4840e-04) (hash(x)=29804750) +2698 train 7.554042 (lr=1.4838e-04) (hash(x)=28443583) +2699 train 7.427953 (lr=1.4836e-04) (hash(x)=29156288) +2700 val loss 7.0841 +2700 val perplexity 1192.8489 +2700 train 7.055606 (lr=1.4834e-04) (hash(x)=25895743) +2701 train 6.696983 (lr=1.4832e-04) (hash(x)=21173795) +2702 train 6.602852 (lr=1.4830e-04) (hash(x)=20790866) +2703 train 7.261346 (lr=1.4829e-04) (hash(x)=27706477) +2704 train 7.325912 (lr=1.4827e-04) (hash(x)=30358985) +2705 train 6.945287 (lr=1.4825e-04) (hash(x)=23548492) +2706 train 7.052394 (lr=1.4823e-04) (hash(x)=25879696) +2707 train 6.941432 (lr=1.4821e-04) (hash(x)=23711800) +2708 train 7.467702 (lr=1.4819e-04) (hash(x)=28763123) +2709 train 7.142119 (lr=1.4817e-04) (hash(x)=23327642) +2710 train 7.187555 (lr=1.4816e-04) (hash(x)=25634166) +2711 train 7.054420 (lr=1.4814e-04) (hash(x)=28684175) +2712 train 7.165923 (lr=1.4812e-04) (hash(x)=23996278) +2713 train 6.751974 (lr=1.4810e-04) (hash(x)=21795980) +2714 train 7.056144 (lr=1.4808e-04) (hash(x)=24840769) +2715 train 7.016533 (lr=1.4806e-04) (hash(x)=25225466) +2716 train 7.356701 (lr=1.4804e-04) (hash(x)=27500471) +2717 train 7.027477 (lr=1.4803e-04) (hash(x)=24703036) +2718 train 7.163373 (lr=1.4801e-04) (hash(x)=24294293) +2719 train 7.085887 (lr=1.4799e-04) (hash(x)=28003600) +2720 train 6.813573 (lr=1.4797e-04) (hash(x)=22822962) +2721 train 6.662955 (lr=1.4795e-04) (hash(x)=24189246) +2722 train 6.813545 (lr=1.4793e-04) (hash(x)=22608951) +2723 train 7.449745 (lr=1.4791e-04) (hash(x)=27989890) +2724 train 7.193363 (lr=1.4790e-04) (hash(x)=24175838) +2725 train 7.064836 (lr=1.4788e-04) (hash(x)=24781792) +2726 train 6.892258 (lr=1.4786e-04) (hash(x)=23413276) +2727 train 7.280737 (lr=1.4784e-04) (hash(x)=27586845) +2728 train 7.049633 (lr=1.4782e-04) (hash(x)=27336264) +2729 train 7.136023 (lr=1.4780e-04) (hash(x)=26808464) +2730 train 6.965496 (lr=1.4778e-04) (hash(x)=22312009) +2731 train 6.992794 (lr=1.4776e-04) (hash(x)=22373927) +2732 train 6.937834 (lr=1.4775e-04) (hash(x)=23428834) +2733 train 6.973222 (lr=1.4773e-04) (hash(x)=25304441) +2734 train 7.010925 (lr=1.4771e-04) (hash(x)=24798164) +2735 train 6.798308 (lr=1.4769e-04) (hash(x)=21176405) +2736 train 6.886014 (lr=1.4767e-04) (hash(x)=22343075) +2737 train 6.937941 (lr=1.4765e-04) (hash(x)=23825332) +2738 train 6.998721 (lr=1.4763e-04) (hash(x)=24191865) +2739 train 6.836322 (lr=1.4761e-04) (hash(x)=23806052) +2740 train 6.859039 (lr=1.4760e-04) (hash(x)=21764591) +2741 train 7.025884 (lr=1.4758e-04) (hash(x)=25548695) +2742 train 7.228382 (lr=1.4756e-04) (hash(x)=26847535) +2743 train 6.924667 (lr=1.4754e-04) (hash(x)=25888433) +2744 train 6.892555 (lr=1.4752e-04) (hash(x)=24327454) +2745 train 6.813457 (lr=1.4750e-04) (hash(x)=22543301) +2746 train 7.245702 (lr=1.4748e-04) (hash(x)=24593022) +2747 train 7.873624 (lr=1.4746e-04) (hash(x)=27797727) +2748 train 7.282182 (lr=1.4745e-04) (hash(x)=28067682) +2749 train 6.929089 (lr=1.4743e-04) (hash(x)=25278538) +2750 val loss 7.0765 +2750 val perplexity 1183.8737 +2750 train 6.846205 (lr=1.4741e-04) (hash(x)=23875731) +2751 train 7.031215 (lr=1.4739e-04) (hash(x)=27916982) +2752 train 7.015106 (lr=1.4737e-04) (hash(x)=25726799) +2753 train 6.840036 (lr=1.4735e-04) (hash(x)=25227141) +2754 train 7.123128 (lr=1.4733e-04) (hash(x)=27679212) +2755 train 6.757295 (lr=1.4731e-04) (hash(x)=24621793) +2756 train 6.738464 (lr=1.4729e-04) (hash(x)=21962296) +2757 train 7.110433 (lr=1.4728e-04) (hash(x)=24899679) +2758 train 6.779369 (lr=1.4726e-04) (hash(x)=21452158) +2759 train 6.903360 (lr=1.4724e-04) (hash(x)=24334708) +2760 train 7.156793 (lr=1.4722e-04) (hash(x)=25523041) +2761 train 7.216086 (lr=1.4720e-04) (hash(x)=30389813) +2762 train 6.821430 (lr=1.4718e-04) (hash(x)=22426014) +2763 train 6.918996 (lr=1.4716e-04) (hash(x)=24419143) +2764 train 6.989602 (lr=1.4714e-04) (hash(x)=24850536) +2765 train 7.062342 (lr=1.4712e-04) (hash(x)=24181393) +2766 train 6.549267 (lr=1.4711e-04) (hash(x)=18882503) +2767 train 7.075835 (lr=1.4709e-04) (hash(x)=25617709) +2768 train 6.977767 (lr=1.4707e-04) (hash(x)=24076662) +2769 train 6.907358 (lr=1.4705e-04) (hash(x)=21656802) +2770 train 6.830225 (lr=1.4703e-04) (hash(x)=21014265) +2771 train 7.001555 (lr=1.4701e-04) (hash(x)=24556034) +2772 train 6.707193 (lr=1.4699e-04) (hash(x)=22046665) +2773 train 7.061160 (lr=1.4697e-04) (hash(x)=26761579) +2774 train 8.671991 (lr=1.4695e-04) (hash(x)=41414315) +2775 train 6.963020 (lr=1.4694e-04) (hash(x)=25152362) +2776 train 7.144858 (lr=1.4692e-04) (hash(x)=25567641) +2777 train 7.090589 (lr=1.4690e-04) (hash(x)=25427935) +2778 train 7.151031 (lr=1.4688e-04) (hash(x)=25824457) +2779 train 7.042968 (lr=1.4686e-04) (hash(x)=24326376) +2780 train 7.077046 (lr=1.4684e-04) (hash(x)=27447230) +2781 train 6.882019 (lr=1.4682e-04) (hash(x)=24003710) +2782 train 6.785607 (lr=1.4680e-04) (hash(x)=24157390) +2783 train 6.926277 (lr=1.4678e-04) (hash(x)=24276512) +2784 train 6.730082 (lr=1.4677e-04) (hash(x)=21503752) +2785 train 6.708063 (lr=1.4675e-04) (hash(x)=20031488) +2786 train 6.699768 (lr=1.4673e-04) (hash(x)=21788715) +2787 train 6.936270 (lr=1.4671e-04) (hash(x)=24344695) +2788 train 6.997646 (lr=1.4669e-04) (hash(x)=22927763) +2789 train 6.862720 (lr=1.4667e-04) (hash(x)=23710755) +2790 train 7.119218 (lr=1.4665e-04) (hash(x)=26924620) +2791 train 7.441808 (lr=1.4663e-04) (hash(x)=26776133) +2792 train 6.864084 (lr=1.4661e-04) (hash(x)=19936770) +2793 train 7.018974 (lr=1.4659e-04) (hash(x)=25440959) +2794 train 6.950125 (lr=1.4658e-04) (hash(x)=25146097) +2795 train 6.767381 (lr=1.4656e-04) (hash(x)=21847282) +2796 train 6.988954 (lr=1.4654e-04) (hash(x)=25639784) +2797 train 6.756124 (lr=1.4652e-04) (hash(x)=21199921) +2798 train 6.941453 (lr=1.4650e-04) (hash(x)=22360806) +2799 train 6.422914 (lr=1.4648e-04) (hash(x)=20254159) +2800 val loss 7.0761 +2800 val perplexity 1183.3308 +2800 train 6.592142 (lr=1.4646e-04) (hash(x)=23348345) +2801 train 7.185472 (lr=1.4644e-04) (hash(x)=24908033) +2802 train 6.903802 (lr=1.4642e-04) (hash(x)=23350309) +2803 train 6.980145 (lr=1.4640e-04) (hash(x)=25044762) +2804 train 6.861524 (lr=1.4638e-04) (hash(x)=24071026) +2805 train 6.653373 (lr=1.4637e-04) (hash(x)=22169363) +2806 train 6.955113 (lr=1.4635e-04) (hash(x)=23757564) +2807 train 7.420169 (lr=1.4633e-04) (hash(x)=27873855) +2808 train 7.133363 (lr=1.4631e-04) (hash(x)=26577893) +2809 train 7.199489 (lr=1.4629e-04) (hash(x)=27001634) +2810 train 6.991457 (lr=1.4627e-04) (hash(x)=24796541) +2811 train 6.864337 (lr=1.4625e-04) (hash(x)=22575615) +2812 train 6.977501 (lr=1.4623e-04) (hash(x)=25876475) +2813 train 6.990419 (lr=1.4621e-04) (hash(x)=24765155) +2814 train 6.902019 (lr=1.4619e-04) (hash(x)=25785699) +2815 train 7.121959 (lr=1.4617e-04) (hash(x)=25113614) +2816 train 6.977991 (lr=1.4616e-04) (hash(x)=24415748) +2817 train 7.050143 (lr=1.4614e-04) (hash(x)=25140622) +2818 train 6.974824 (lr=1.4612e-04) (hash(x)=24845866) +2819 train 7.453195 (lr=1.4610e-04) (hash(x)=28062905) +2820 train 6.921814 (lr=1.4608e-04) (hash(x)=22041086) +2821 train 7.082716 (lr=1.4606e-04) (hash(x)=24957184) +2822 train 6.970317 (lr=1.4604e-04) (hash(x)=24360380) +2823 train 7.115250 (lr=1.4602e-04) (hash(x)=26192886) +2824 train 6.976514 (lr=1.4600e-04) (hash(x)=25001858) +2825 train 6.947998 (lr=1.4598e-04) (hash(x)=24721193) +2826 train 7.000239 (lr=1.4596e-04) (hash(x)=26186227) +2827 train 6.953711 (lr=1.4594e-04) (hash(x)=25770338) +2828 train 7.062195 (lr=1.4593e-04) (hash(x)=25920767) +2829 train 6.960656 (lr=1.4591e-04) (hash(x)=25060684) +2830 train 6.615079 (lr=1.4589e-04) (hash(x)=22933946) +2831 train 6.828625 (lr=1.4587e-04) (hash(x)=24614912) +2832 train 6.548120 (lr=1.4585e-04) (hash(x)=19955522) +2833 train 6.587925 (lr=1.4583e-04) (hash(x)=21111215) +2834 train 7.500885 (lr=1.4581e-04) (hash(x)=28817924) +2835 train 7.058974 (lr=1.4579e-04) (hash(x)=26934071) +2836 train 6.972085 (lr=1.4577e-04) (hash(x)=24768851) +2837 train 6.943922 (lr=1.4575e-04) (hash(x)=25706447) +2838 train 6.715574 (lr=1.4573e-04) (hash(x)=19579834) +2839 train 6.954831 (lr=1.4571e-04) (hash(x)=25397093) +2840 train 7.325934 (lr=1.4569e-04) (hash(x)=27902141) +2841 train 7.039800 (lr=1.4568e-04) (hash(x)=25383069) +2842 train 6.803904 (lr=1.4566e-04) (hash(x)=22007373) +2843 train 6.897631 (lr=1.4564e-04) (hash(x)=25925963) +2844 train 6.960383 (lr=1.4562e-04) (hash(x)=25711128) +2845 train 6.639030 (lr=1.4560e-04) (hash(x)=21881216) +2846 train 6.831920 (lr=1.4558e-04) (hash(x)=20277075) +2847 train 6.883132 (lr=1.4556e-04) (hash(x)=19811802) +2848 train 6.823411 (lr=1.4554e-04) (hash(x)=23878906) +2849 train 7.089432 (lr=1.4552e-04) (hash(x)=25034966) +2850 val loss 7.0608 +2850 val perplexity 1165.3539 +2850 train 7.111237 (lr=1.4550e-04) (hash(x)=24359507) +2851 train 6.866664 (lr=1.4548e-04) (hash(x)=23248423) +2852 train 6.841869 (lr=1.4546e-04) (hash(x)=21782773) +2853 train 6.994428 (lr=1.4544e-04) (hash(x)=23804418) +2854 train 7.044750 (lr=1.4542e-04) (hash(x)=22525078) +2855 train 7.025974 (lr=1.4541e-04) (hash(x)=25579655) +2856 train 7.133368 (lr=1.4539e-04) (hash(x)=27048876) +2857 train 7.226436 (lr=1.4537e-04) (hash(x)=26468479) +2858 train 6.910686 (lr=1.4535e-04) (hash(x)=23854933) +2859 train 7.331135 (lr=1.4533e-04) (hash(x)=25537603) +2860 train 6.728036 (lr=1.4531e-04) (hash(x)=20979252) +2861 train 7.268160 (lr=1.4529e-04) (hash(x)=26504374) +2862 train 7.059073 (lr=1.4527e-04) (hash(x)=27561842) +2863 train 7.060140 (lr=1.4525e-04) (hash(x)=26096514) +2864 train 7.113531 (lr=1.4523e-04) (hash(x)=25926899) +2865 train 7.145185 (lr=1.4521e-04) (hash(x)=26058348) +2866 train 7.101745 (lr=1.4519e-04) (hash(x)=29802259) +2867 train 7.043449 (lr=1.4517e-04) (hash(x)=24132888) +2868 train 6.720363 (lr=1.4515e-04) (hash(x)=23369410) +2869 train 6.885976 (lr=1.4513e-04) (hash(x)=25387506) +2870 train 7.078958 (lr=1.4511e-04) (hash(x)=27375344) +2871 train 6.825575 (lr=1.4510e-04) (hash(x)=22589633) +2872 train 6.996601 (lr=1.4508e-04) (hash(x)=23250237) +2873 train 6.912593 (lr=1.4506e-04) (hash(x)=25511322) +2874 train 6.547803 (lr=1.4504e-04) (hash(x)=18356418) +2875 train 7.025176 (lr=1.4502e-04) (hash(x)=27781566) +2876 train 6.891735 (lr=1.4500e-04) (hash(x)=24878173) +2877 train 7.388432 (lr=1.4498e-04) (hash(x)=30018637) +2878 train 7.201280 (lr=1.4496e-04) (hash(x)=27168416) +2879 train 7.180905 (lr=1.4494e-04) (hash(x)=26757147) +2880 train 7.235468 (lr=1.4492e-04) (hash(x)=26637081) +2881 train 7.084671 (lr=1.4490e-04) (hash(x)=24795024) +2882 train 7.339188 (lr=1.4488e-04) (hash(x)=29787745) +2883 train 7.170990 (lr=1.4486e-04) (hash(x)=26649864) +2884 train 7.015083 (lr=1.4484e-04) (hash(x)=27306612) +2885 train 7.111845 (lr=1.4482e-04) (hash(x)=27568311) +2886 train 7.135700 (lr=1.4480e-04) (hash(x)=27440150) +2887 train 6.870781 (lr=1.4478e-04) (hash(x)=24963730) +2888 train 6.892936 (lr=1.4476e-04) (hash(x)=23619807) +2889 train 7.383066 (lr=1.4475e-04) (hash(x)=29447356) +2890 train 6.863153 (lr=1.4473e-04) (hash(x)=25144675) +2891 train 6.793150 (lr=1.4471e-04) (hash(x)=25249959) +2892 train 6.830724 (lr=1.4469e-04) (hash(x)=26608712) +2893 train 6.873682 (lr=1.4467e-04) (hash(x)=26333258) +2894 train 6.688982 (lr=1.4465e-04) (hash(x)=20682182) +2895 train 7.088427 (lr=1.4463e-04) (hash(x)=27703124) +2896 train 6.886674 (lr=1.4461e-04) (hash(x)=23228180) +2897 train 6.783470 (lr=1.4459e-04) (hash(x)=25252411) +2898 train 6.741062 (lr=1.4457e-04) (hash(x)=22879178) +2899 train 7.028372 (lr=1.4455e-04) (hash(x)=26459082) +2900 val loss 7.0425 +2900 val perplexity 1144.2075 +2900 train 6.865454 (lr=1.4453e-04) (hash(x)=24569501) +2901 train 6.632803 (lr=1.4451e-04) (hash(x)=19803884) +2902 train 6.675519 (lr=1.4449e-04) (hash(x)=18799747) +2903 train 6.997825 (lr=1.4447e-04) (hash(x)=24781713) +2904 train 7.169712 (lr=1.4445e-04) (hash(x)=25016590) +2905 train 7.369180 (lr=1.4443e-04) (hash(x)=29006906) +2906 train 7.065897 (lr=1.4441e-04) (hash(x)=24069959) +2907 train 7.241972 (lr=1.4439e-04) (hash(x)=26597693) +2908 train 6.885385 (lr=1.4437e-04) (hash(x)=25014146) +2909 train 7.096916 (lr=1.4435e-04) (hash(x)=24943747) +2910 train 7.016023 (lr=1.4433e-04) (hash(x)=27847542) +2911 train 6.910855 (lr=1.4432e-04) (hash(x)=24720476) +2912 train 6.783957 (lr=1.4430e-04) (hash(x)=24388804) +2913 train 6.905208 (lr=1.4428e-04) (hash(x)=23567535) +2914 train 7.243207 (lr=1.4426e-04) (hash(x)=29673625) +2915 train 6.939025 (lr=1.4424e-04) (hash(x)=23691295) +2916 train 7.329095 (lr=1.4422e-04) (hash(x)=26572819) +2917 train 6.928617 (lr=1.4420e-04) (hash(x)=23237812) +2918 train 7.209789 (lr=1.4418e-04) (hash(x)=26531016) +2919 train 6.747639 (lr=1.4416e-04) (hash(x)=23481301) +2920 train 7.030760 (lr=1.4414e-04) (hash(x)=24839184) +2921 train 6.902791 (lr=1.4412e-04) (hash(x)=23327755) +2922 train 7.165769 (lr=1.4410e-04) (hash(x)=26347114) +2923 train 6.801168 (lr=1.4408e-04) (hash(x)=23295676) +2924 train 6.882685 (lr=1.4406e-04) (hash(x)=24557178) +2925 train 6.947087 (lr=1.4404e-04) (hash(x)=26067788) +2926 train 6.893883 (lr=1.4402e-04) (hash(x)=25694982) +2927 train 6.967803 (lr=1.4400e-04) (hash(x)=25641033) +2928 train 6.990465 (lr=1.4398e-04) (hash(x)=24906422) +2929 train 7.181004 (lr=1.4396e-04) (hash(x)=27803515) +2930 train 7.162146 (lr=1.4394e-04) (hash(x)=26208803) +2931 train 6.615814 (lr=1.4392e-04) (hash(x)=22441379) +2932 train 6.924759 (lr=1.4390e-04) (hash(x)=24741626) +2933 train 6.787843 (lr=1.4388e-04) (hash(x)=24595257) +2934 train 6.859315 (lr=1.4386e-04) (hash(x)=23939167) +2935 train 7.142414 (lr=1.4384e-04) (hash(x)=27369437) +2936 train 6.746334 (lr=1.4382e-04) (hash(x)=21409783) +2937 train 7.035386 (lr=1.4380e-04) (hash(x)=25923735) +2938 train 7.051840 (lr=1.4378e-04) (hash(x)=29559511) +2939 train 6.912515 (lr=1.4376e-04) (hash(x)=24482272) +2940 train 6.908853 (lr=1.4374e-04) (hash(x)=24767658) +2941 train 7.089004 (lr=1.4372e-04) (hash(x)=26425020) +2942 train 7.448839 (lr=1.4371e-04) (hash(x)=27444868) +2943 train 6.895676 (lr=1.4369e-04) (hash(x)=24760900) +2944 train 6.897703 (lr=1.4367e-04) (hash(x)=25605407) +2945 train 6.783440 (lr=1.4365e-04) (hash(x)=22886951) +2946 train 7.132056 (lr=1.4363e-04) (hash(x)=26112205) +2947 train 6.970706 (lr=1.4361e-04) (hash(x)=23919156) +2948 train 6.923347 (lr=1.4359e-04) (hash(x)=23729312) +2949 train 7.192148 (lr=1.4357e-04) (hash(x)=30440878) +2950 val loss 7.0300 +2950 val perplexity 1130.0724 +2950 train 6.634785 (lr=1.4355e-04) (hash(x)=20004041) +2951 train 6.616620 (lr=1.4353e-04) (hash(x)=21692546) +2952 train 6.689867 (lr=1.4351e-04) (hash(x)=23021681) +2953 train 7.049853 (lr=1.4349e-04) (hash(x)=26663597) +2954 train 6.938548 (lr=1.4347e-04) (hash(x)=23727385) +2955 train 6.898294 (lr=1.4345e-04) (hash(x)=27692087) +2956 train 6.944289 (lr=1.4343e-04) (hash(x)=24003378) +2957 train 7.599442 (lr=1.4341e-04) (hash(x)=29534673) +2958 train 6.866406 (lr=1.4339e-04) (hash(x)=22875068) +2959 train 6.836256 (lr=1.4337e-04) (hash(x)=22720391) +2960 train 6.616296 (lr=1.4335e-04) (hash(x)=17997400) +2961 train 6.809098 (lr=1.4333e-04) (hash(x)=22853822) +2962 train 6.884911 (lr=1.4331e-04) (hash(x)=25238004) +2963 train 7.021463 (lr=1.4329e-04) (hash(x)=26146560) +2964 train 7.182697 (lr=1.4327e-04) (hash(x)=21894867) +2965 train 7.126354 (lr=1.4325e-04) (hash(x)=23001150) +2966 train 6.825625 (lr=1.4323e-04) (hash(x)=23392923) +2967 train 6.904552 (lr=1.4321e-04) (hash(x)=24376979) +2968 train 6.853244 (lr=1.4319e-04) (hash(x)=23781449) +2969 train 7.014609 (lr=1.4317e-04) (hash(x)=25315495) +2970 train 7.153559 (lr=1.4315e-04) (hash(x)=27165470) +2971 train 6.962801 (lr=1.4313e-04) (hash(x)=22917712) +2972 train 7.313821 (lr=1.4311e-04) (hash(x)=27928456) +2973 train 6.701489 (lr=1.4309e-04) (hash(x)=19890855) +2974 train 6.637269 (lr=1.4307e-04) (hash(x)=21318134) +2975 train 6.794785 (lr=1.4305e-04) (hash(x)=22244509) +2976 train 6.742040 (lr=1.4303e-04) (hash(x)=21293137) +2977 train 6.826270 (lr=1.4301e-04) (hash(x)=23465789) +2978 train 6.786849 (lr=1.4299e-04) (hash(x)=21169753) +2979 train 7.189897 (lr=1.4297e-04) (hash(x)=25243385) +2980 train 7.241166 (lr=1.4295e-04) (hash(x)=27465812) +2981 train 6.909630 (lr=1.4293e-04) (hash(x)=24615492) +2982 train 6.836869 (lr=1.4291e-04) (hash(x)=23081307) +2983 train 6.609528 (lr=1.4289e-04) (hash(x)=21831960) +2984 train 6.754645 (lr=1.4287e-04) (hash(x)=23242850) +2985 train 6.862461 (lr=1.4285e-04) (hash(x)=24308188) +2986 train 7.064603 (lr=1.4283e-04) (hash(x)=28541601) +2987 train 6.927665 (lr=1.4281e-04) (hash(x)=24842373) +2988 train 6.678722 (lr=1.4279e-04) (hash(x)=21967126) +2989 train 6.878519 (lr=1.4277e-04) (hash(x)=22951616) +2990 train 6.994030 (lr=1.4275e-04) (hash(x)=24325714) +2991 train 6.783180 (lr=1.4273e-04) (hash(x)=24921535) +2992 train 7.045401 (lr=1.4271e-04) (hash(x)=25937112) +2993 train 6.693784 (lr=1.4269e-04) (hash(x)=20716218) +2994 train 6.990322 (lr=1.4267e-04) (hash(x)=25450724) +2995 train 6.930116 (lr=1.4265e-04) (hash(x)=24344615) +2996 train 6.658379 (lr=1.4263e-04) (hash(x)=20299058) +2997 train 6.886609 (lr=1.4261e-04) (hash(x)=23859426) +2998 train 6.849457 (lr=1.4259e-04) (hash(x)=23094397) +2999 train 7.179789 (lr=1.4257e-04) (hash(x)=25381251) +3000 val loss 7.0216 +3000 val perplexity 1120.5388 +3000 train 6.954779 (lr=1.4255e-04) (hash(x)=23586527) +3001 train 6.825876 (lr=1.4253e-04) (hash(x)=24220410) +3002 train 6.659459 (lr=1.4251e-04) (hash(x)=20597347) +3003 train 6.786027 (lr=1.4249e-04) (hash(x)=22887303) +3004 train 7.095329 (lr=1.4247e-04) (hash(x)=25869462) +3005 train 6.796874 (lr=1.4245e-04) (hash(x)=22098530) +3006 train 7.086026 (lr=1.4243e-04) (hash(x)=26246291) +3007 train 7.029573 (lr=1.4241e-04) (hash(x)=25687352) +3008 train 6.792243 (lr=1.4239e-04) (hash(x)=25425646) +3009 train 6.987615 (lr=1.4237e-04) (hash(x)=26021124) +3010 train 7.022785 (lr=1.4235e-04) (hash(x)=25392057) +3011 train 7.094640 (lr=1.4233e-04) (hash(x)=27791412) +3012 train 6.934822 (lr=1.4231e-04) (hash(x)=23181098) +3013 train 6.923679 (lr=1.4229e-04) (hash(x)=25521889) +3014 train 6.728664 (lr=1.4227e-04) (hash(x)=21685795) +3015 train 6.908954 (lr=1.4225e-04) (hash(x)=25221654) +3016 train 7.081611 (lr=1.4223e-04) (hash(x)=24888744) +3017 train 6.986737 (lr=1.4221e-04) (hash(x)=24200150) +3018 train 6.913415 (lr=1.4219e-04) (hash(x)=26943942) +3019 train 6.872386 (lr=1.4217e-04) (hash(x)=23243731) +3020 train 6.739302 (lr=1.4215e-04) (hash(x)=21068284) +3021 train 6.914907 (lr=1.4213e-04) (hash(x)=23876902) +3022 train 7.068872 (lr=1.4211e-04) (hash(x)=25337639) +3023 train 7.001782 (lr=1.4209e-04) (hash(x)=24469863) +3024 train 7.413959 (lr=1.4207e-04) (hash(x)=27850876) +3025 train 7.262804 (lr=1.4205e-04) (hash(x)=20515778) +3026 train 7.054751 (lr=1.4203e-04) (hash(x)=29019173) +3027 train 6.703275 (lr=1.4201e-04) (hash(x)=22484936) +3028 train 6.884694 (lr=1.4199e-04) (hash(x)=24639400) +3029 train 7.039072 (lr=1.4197e-04) (hash(x)=26835174) +3030 train 7.171783 (lr=1.4195e-04) (hash(x)=29843763) +3031 train 6.889822 (lr=1.4193e-04) (hash(x)=25291413) +3032 train 6.805154 (lr=1.4191e-04) (hash(x)=24590244) +3033 train 7.062431 (lr=1.4189e-04) (hash(x)=28880142) +3034 train 6.798786 (lr=1.4187e-04) (hash(x)=23372199) +3035 train 6.806175 (lr=1.4185e-04) (hash(x)=23952225) +3036 train 6.893361 (lr=1.4183e-04) (hash(x)=24589186) +3037 train 6.916435 (lr=1.4181e-04) (hash(x)=23260323) +3038 train 7.077724 (lr=1.4179e-04) (hash(x)=25824498) +3039 train 7.022209 (lr=1.4177e-04) (hash(x)=25744274) +3040 train 6.963184 (lr=1.4175e-04) (hash(x)=21610247) +3041 train 7.094031 (lr=1.4173e-04) (hash(x)=25079786) +3042 train 6.717859 (lr=1.4171e-04) (hash(x)=23219195) +3043 train 6.700324 (lr=1.4169e-04) (hash(x)=22616739) +3044 train 6.973850 (lr=1.4167e-04) (hash(x)=24908480) +3045 train 6.837415 (lr=1.4165e-04) (hash(x)=22293489) +3046 train 6.818888 (lr=1.4163e-04) (hash(x)=23557651) +3047 train 6.866081 (lr=1.4161e-04) (hash(x)=24246963) +3048 train 6.998309 (lr=1.4159e-04) (hash(x)=24490083) +3049 train 6.967356 (lr=1.4157e-04) (hash(x)=22372895) +3050 val loss 7.0334 +3050 val perplexity 1133.8999 +3050 train 6.673175 (lr=1.4155e-04) (hash(x)=21759470) +3051 train 6.576538 (lr=1.4153e-04) (hash(x)=19407094) +3052 train 6.982529 (lr=1.4151e-04) (hash(x)=23957047) +3053 train 7.064012 (lr=1.4148e-04) (hash(x)=24719318) +3054 train 6.835114 (lr=1.4146e-04) (hash(x)=20719314) +3055 train 6.787624 (lr=1.4144e-04) (hash(x)=19724058) +3056 train 6.609732 (lr=1.4142e-04) (hash(x)=14407266) +3057 train 6.462769 (lr=1.4140e-04) (hash(x)=12468292) +3058 train 6.754627 (lr=1.4138e-04) (hash(x)=16098279) +3059 train 6.838356 (lr=1.4136e-04) (hash(x)=18836491) +3060 train 6.651974 (lr=1.4134e-04) (hash(x)=19132277) +3061 train 6.772598 (lr=1.4132e-04) (hash(x)=22814208) +3062 train 6.870567 (lr=1.4130e-04) (hash(x)=24838508) +3063 train 6.738409 (lr=1.4128e-04) (hash(x)=20705649) +3064 train 7.777894 (lr=1.4126e-04) (hash(x)=29416914) +3065 train 7.241906 (lr=1.4124e-04) (hash(x)=25972430) +3066 train 6.609014 (lr=1.4122e-04) (hash(x)=23705805) +3067 train 6.686887 (lr=1.4120e-04) (hash(x)=21325875) +3068 train 6.902487 (lr=1.4118e-04) (hash(x)=23526506) +3069 train 7.397089 (lr=1.4116e-04) (hash(x)=27282337) +3070 train 7.223746 (lr=1.4114e-04) (hash(x)=27968043) +3071 train 7.033967 (lr=1.4112e-04) (hash(x)=24938685) +3072 train 7.219849 (lr=1.4110e-04) (hash(x)=26942737) +3073 train 7.114247 (lr=1.4108e-04) (hash(x)=23506879) +3074 train 6.787026 (lr=1.4106e-04) (hash(x)=23589913) +3075 train 6.983140 (lr=1.4104e-04) (hash(x)=25152403) +3076 train 7.114691 (lr=1.4102e-04) (hash(x)=23425868) +3077 train 7.278720 (lr=1.4100e-04) (hash(x)=23966181) +3078 train 7.356381 (lr=1.4098e-04) (hash(x)=27312570) +3079 train 6.968453 (lr=1.4096e-04) (hash(x)=21707000) +3080 train 6.856904 (lr=1.4094e-04) (hash(x)=25600427) +3081 train 7.020110 (lr=1.4092e-04) (hash(x)=24270631) +3082 train 7.108582 (lr=1.4090e-04) (hash(x)=25199537) +3083 train 6.374699 (lr=1.4088e-04) (hash(x)=17952018) +3084 train 6.480540 (lr=1.4086e-04) (hash(x)=18733143) +3085 train 7.094807 (lr=1.4083e-04) (hash(x)=26946100) +3086 train 6.926248 (lr=1.4081e-04) (hash(x)=25547515) +3087 train 6.880259 (lr=1.4079e-04) (hash(x)=24948980) +3088 train 8.126212 (lr=1.4077e-04) (hash(x)=35461645) +3089 train 7.156208 (lr=1.4075e-04) (hash(x)=28330877) +3090 train 7.081104 (lr=1.4073e-04) (hash(x)=27687861) +3091 train 7.183820 (lr=1.4071e-04) (hash(x)=28012110) +3092 train 7.052270 (lr=1.4069e-04) (hash(x)=24684480) +3093 train 7.004275 (lr=1.4067e-04) (hash(x)=26225786) +3094 train 6.685342 (lr=1.4065e-04) (hash(x)=23098156) +3095 train 7.285057 (lr=1.4063e-04) (hash(x)=30773958) +3096 train 7.590760 (lr=1.4061e-04) (hash(x)=28640406) +3097 train 7.554583 (lr=1.4059e-04) (hash(x)=28201086) +3098 train 7.834469 (lr=1.4057e-04) (hash(x)=35002344) +3099 train 7.358875 (lr=1.4055e-04) (hash(x)=29481068) +3100 val loss 7.0321 +3100 val perplexity 1132.3875 +3100 train 6.911610 (lr=1.4053e-04) (hash(x)=26374528) +3101 train 6.871686 (lr=1.4051e-04) (hash(x)=24153602) +3102 train 6.934402 (lr=1.4049e-04) (hash(x)=25478746) +3103 train 7.227911 (lr=1.4047e-04) (hash(x)=26769046) +3104 train 6.806159 (lr=1.4045e-04) (hash(x)=21841970) +3105 train 7.149578 (lr=1.4043e-04) (hash(x)=27693052) +3106 train 6.570683 (lr=1.4041e-04) (hash(x)=20689448) +3107 train 6.935520 (lr=1.4038e-04) (hash(x)=26755048) +3108 train 7.011572 (lr=1.4036e-04) (hash(x)=24431904) +3109 train 6.872661 (lr=1.4034e-04) (hash(x)=21009792) +3110 train 6.915995 (lr=1.4032e-04) (hash(x)=21909003) +3111 train 6.984195 (lr=1.4030e-04) (hash(x)=18849656) +3112 train 7.045714 (lr=1.4028e-04) (hash(x)=22223376) +3113 train 7.337810 (lr=1.4026e-04) (hash(x)=25652491) +3114 train 7.249652 (lr=1.4024e-04) (hash(x)=23521434) +3115 train 7.296858 (lr=1.4022e-04) (hash(x)=25449800) +3116 train 7.628407 (lr=1.4020e-04) (hash(x)=27655847) +3117 train 7.651495 (lr=1.4018e-04) (hash(x)=29878248) +3118 train 7.614899 (lr=1.4016e-04) (hash(x)=30444094) +3119 train 7.384429 (lr=1.4014e-04) (hash(x)=24624950) +3120 train 6.757001 (lr=1.4012e-04) (hash(x)=20798511) +3121 train 7.123212 (lr=1.4010e-04) (hash(x)=26581679) +3122 train 6.996698 (lr=1.4008e-04) (hash(x)=25333422) +3123 train 7.058990 (lr=1.4006e-04) (hash(x)=26174069) +3124 train 7.149976 (lr=1.4004e-04) (hash(x)=25219475) +3125 train 7.032917 (lr=1.4002e-04) (hash(x)=20919061) +3126 train 6.971895 (lr=1.3999e-04) (hash(x)=23828688) +3127 train 7.483534 (lr=1.3997e-04) (hash(x)=27299605) +3128 train 6.824922 (lr=1.3995e-04) (hash(x)=23797514) +3129 train 7.070816 (lr=1.3993e-04) (hash(x)=23601883) +3130 train 7.279706 (lr=1.3991e-04) (hash(x)=31003964) +3131 train 7.014076 (lr=1.3989e-04) (hash(x)=24777273) +3132 train 6.866571 (lr=1.3987e-04) (hash(x)=25403249) +3133 train 7.161063 (lr=1.3985e-04) (hash(x)=28913150) +3134 train 7.053827 (lr=1.3983e-04) (hash(x)=26541508) +3135 train 7.053128 (lr=1.3981e-04) (hash(x)=24113445) +3136 train 6.809932 (lr=1.3979e-04) (hash(x)=25464565) +3137 train 7.077193 (lr=1.3977e-04) (hash(x)=26581432) +3138 train 6.928932 (lr=1.3975e-04) (hash(x)=23074513) +3139 train 6.786002 (lr=1.3973e-04) (hash(x)=23970384) +3140 train 7.064447 (lr=1.3971e-04) (hash(x)=26694495) +3141 train 7.045078 (lr=1.3969e-04) (hash(x)=26883445) +3142 train 7.177116 (lr=1.3966e-04) (hash(x)=28632211) +3143 train 7.636470 (lr=1.3964e-04) (hash(x)=32644465) +3144 train 7.318238 (lr=1.3962e-04) (hash(x)=27490443) +3145 train 6.919232 (lr=1.3960e-04) (hash(x)=23814853) +3146 train 7.322248 (lr=1.3958e-04) (hash(x)=29664236) +3147 train 7.630128 (lr=1.3956e-04) (hash(x)=29951548) +3148 train 7.352402 (lr=1.3954e-04) (hash(x)=28426503) +3149 train 6.778499 (lr=1.3952e-04) (hash(x)=23727657) +3150 val loss 7.0585 +3150 val perplexity 1162.6481 +3150 train 6.951931 (lr=1.3950e-04) (hash(x)=21430659) +3151 train 6.992903 (lr=1.3948e-04) (hash(x)=25829219) +3152 train 7.113842 (lr=1.3946e-04) (hash(x)=29735208) +3153 train 7.199296 (lr=1.3944e-04) (hash(x)=28173447) +3154 train 6.886664 (lr=1.3942e-04) (hash(x)=22909641) +3155 train 6.992139 (lr=1.3940e-04) (hash(x)=20556094) +3156 train 6.787427 (lr=1.3938e-04) (hash(x)=24013769) +3157 train 6.811203 (lr=1.3935e-04) (hash(x)=22525971) +3158 train 6.901971 (lr=1.3933e-04) (hash(x)=25492728) +3159 train 6.933763 (lr=1.3931e-04) (hash(x)=25194550) +3160 train 7.037399 (lr=1.3929e-04) (hash(x)=25610603) +3161 train 7.029744 (lr=1.3927e-04) (hash(x)=23848640) +3162 train 6.814719 (lr=1.3925e-04) (hash(x)=24082226) +3163 train 7.200378 (lr=1.3923e-04) (hash(x)=28482186) +3164 train 7.099347 (lr=1.3921e-04) (hash(x)=27542978) +3165 train 6.870113 (lr=1.3919e-04) (hash(x)=22540954) +3166 train 6.987584 (lr=1.3917e-04) (hash(x)=26103641) +3167 train 6.969547 (lr=1.3915e-04) (hash(x)=25941804) +3168 train 6.998022 (lr=1.3913e-04) (hash(x)=25965921) +3169 train 7.212547 (lr=1.3911e-04) (hash(x)=25631269) +3170 train 6.815599 (lr=1.3909e-04) (hash(x)=23471525) +3171 train 7.043671 (lr=1.3906e-04) (hash(x)=27049208) +3172 train 7.044585 (lr=1.3904e-04) (hash(x)=27074992) +3173 train 6.976913 (lr=1.3902e-04) (hash(x)=25712617) +3174 train 6.934067 (lr=1.3900e-04) (hash(x)=25884917) +3175 train 6.974744 (lr=1.3898e-04) (hash(x)=24075727) +3176 train 6.838780 (lr=1.3896e-04) (hash(x)=23681759) +3177 train 7.123473 (lr=1.3894e-04) (hash(x)=25786577) +3178 train 7.082046 (lr=1.3892e-04) (hash(x)=27307614) +3179 train 7.138292 (lr=1.3890e-04) (hash(x)=25082806) +3180 train 7.107864 (lr=1.3888e-04) (hash(x)=26098308) +3181 train 6.867712 (lr=1.3886e-04) (hash(x)=24080140) +3182 train 7.092519 (lr=1.3884e-04) (hash(x)=26399395) +3183 train 7.120273 (lr=1.3882e-04) (hash(x)=23104539) +3184 train 6.776585 (lr=1.3879e-04) (hash(x)=23356930) +3185 train 7.028108 (lr=1.3877e-04) (hash(x)=27972420) +3186 train 6.687612 (lr=1.3875e-04) (hash(x)=21338924) +3187 train 7.161572 (lr=1.3873e-04) (hash(x)=25351113) +3188 train 7.116469 (lr=1.3871e-04) (hash(x)=26019439) +3189 train 7.161747 (lr=1.3869e-04) (hash(x)=30149312) +3190 train 6.837650 (lr=1.3867e-04) (hash(x)=23028152) +3191 train 7.233336 (lr=1.3865e-04) (hash(x)=23018983) +3192 train 6.827641 (lr=1.3863e-04) (hash(x)=23190787) +3193 train 7.253102 (lr=1.3861e-04) (hash(x)=27798543) +3194 train 7.027523 (lr=1.3859e-04) (hash(x)=25193663) +3195 train 6.844335 (lr=1.3856e-04) (hash(x)=25302106) +3196 train 6.988497 (lr=1.3854e-04) (hash(x)=24325364) +3197 train 7.010740 (lr=1.3852e-04) (hash(x)=25399101) +3198 train 6.841630 (lr=1.3850e-04) (hash(x)=23606439) +3199 train 6.902729 (lr=1.3848e-04) (hash(x)=24422929) +3200 val loss 7.0196 +3200 val perplexity 1118.3801 +3200 train 7.070745 (lr=1.3846e-04) (hash(x)=24760381) +3201 train 6.708649 (lr=1.3844e-04) (hash(x)=23278576) +3202 train 6.955152 (lr=1.3842e-04) (hash(x)=24897511) +3203 train 7.305270 (lr=1.3840e-04) (hash(x)=29052117) +3204 train 6.937046 (lr=1.3838e-04) (hash(x)=25772923) +3205 train 7.147914 (lr=1.3836e-04) (hash(x)=25885977) +3206 train 6.917879 (lr=1.3834e-04) (hash(x)=21985272) +3207 train 6.824918 (lr=1.3831e-04) (hash(x)=23389696) +3208 train 6.758564 (lr=1.3829e-04) (hash(x)=25299042) +3209 train 7.070700 (lr=1.3827e-04) (hash(x)=23703987) +3210 train 6.943871 (lr=1.3825e-04) (hash(x)=23362342) +3211 train 6.994569 (lr=1.3823e-04) (hash(x)=23962503) +3212 train 6.857426 (lr=1.3821e-04) (hash(x)=21216023) +3213 train 6.963562 (lr=1.3819e-04) (hash(x)=25841931) +3214 train 6.813507 (lr=1.3817e-04) (hash(x)=23631428) +3215 train 7.209392 (lr=1.3815e-04) (hash(x)=29102969) +3216 train 6.924550 (lr=1.3813e-04) (hash(x)=25782766) +3217 train 7.225320 (lr=1.3810e-04) (hash(x)=28825867) +3218 train 7.164013 (lr=1.3808e-04) (hash(x)=24609499) +3219 train 7.097374 (lr=1.3806e-04) (hash(x)=24948166) +3220 train 7.201769 (lr=1.3804e-04) (hash(x)=26919841) +3221 train 7.014784 (lr=1.3802e-04) (hash(x)=27236198) +3222 train 6.804639 (lr=1.3800e-04) (hash(x)=24029305) +3223 train 7.355251 (lr=1.3798e-04) (hash(x)=28359859) +3224 train 7.150215 (lr=1.3796e-04) (hash(x)=24886008) +3225 train 6.981586 (lr=1.3794e-04) (hash(x)=27159867) +3226 train 7.290050 (lr=1.3792e-04) (hash(x)=20672023) +3227 train 6.907709 (lr=1.3790e-04) (hash(x)=22360298) +3228 train 7.346326 (lr=1.3787e-04) (hash(x)=27478658) +3229 train 7.176300 (lr=1.3785e-04) (hash(x)=26575886) +3230 train 7.354841 (lr=1.3783e-04) (hash(x)=26890615) +3231 train 6.969069 (lr=1.3781e-04) (hash(x)=24630955) +3232 train 7.280580 (lr=1.3779e-04) (hash(x)=27016054) +3233 train 7.412698 (lr=1.3777e-04) (hash(x)=28444407) +3234 train 6.819452 (lr=1.3775e-04) (hash(x)=24053336) +3235 train 7.137734 (lr=1.3773e-04) (hash(x)=26897402) +3236 train 7.305554 (lr=1.3771e-04) (hash(x)=29451214) +3237 train 7.065551 (lr=1.3768e-04) (hash(x)=27268677) +3238 train 7.237040 (lr=1.3766e-04) (hash(x)=27494000) +3239 train 6.859720 (lr=1.3764e-04) (hash(x)=22969113) +3240 train 6.809533 (lr=1.3762e-04) (hash(x)=21944576) +3241 train 7.005728 (lr=1.3760e-04) (hash(x)=21671079) +3242 train 6.904950 (lr=1.3758e-04) (hash(x)=23912980) +3243 train 6.870149 (lr=1.3756e-04) (hash(x)=25205781) +3244 train 6.872405 (lr=1.3754e-04) (hash(x)=25654244) +3245 train 6.795732 (lr=1.3752e-04) (hash(x)=23335929) +3246 train 7.201141 (lr=1.3750e-04) (hash(x)=27953926) +3247 train 6.963520 (lr=1.3747e-04) (hash(x)=27004415) +3248 train 6.655182 (lr=1.3745e-04) (hash(x)=20471566) +3249 train 6.842812 (lr=1.3743e-04) (hash(x)=25797941) +3250 val loss 6.9958 +3250 val perplexity 1092.0662 +3250 train 6.756437 (lr=1.3741e-04) (hash(x)=21787064) +3251 train 6.750515 (lr=1.3739e-04) (hash(x)=22974875) +3252 train 7.041139 (lr=1.3737e-04) (hash(x)=28431267) +3253 train 6.933267 (lr=1.3735e-04) (hash(x)=25584910) +3254 train 6.715953 (lr=1.3733e-04) (hash(x)=23888922) +3255 train 6.944420 (lr=1.3731e-04) (hash(x)=22265063) +3256 train 6.554312 (lr=1.3728e-04) (hash(x)=21926624) +3257 train 6.824380 (lr=1.3726e-04) (hash(x)=23073191) +3258 train 6.825093 (lr=1.3724e-04) (hash(x)=24409183) +3259 train 6.913299 (lr=1.3722e-04) (hash(x)=23312114) +3260 train 6.801816 (lr=1.3720e-04) (hash(x)=21001289) +3261 train 7.038881 (lr=1.3718e-04) (hash(x)=25514824) +3262 train 6.784956 (lr=1.3716e-04) (hash(x)=22526800) +3263 train 7.208756 (lr=1.3714e-04) (hash(x)=26905990) +3264 train 6.852475 (lr=1.3712e-04) (hash(x)=24469631) +3265 train 6.740854 (lr=1.3709e-04) (hash(x)=21149081) +3266 train 6.921844 (lr=1.3707e-04) (hash(x)=24696215) +3267 train 7.213736 (lr=1.3705e-04) (hash(x)=27089280) +3268 train 6.793275 (lr=1.3703e-04) (hash(x)=23100446) +3269 train 7.049330 (lr=1.3701e-04) (hash(x)=25061229) +3270 train 6.923704 (lr=1.3699e-04) (hash(x)=24337543) +3271 train 6.997865 (lr=1.3697e-04) (hash(x)=24047679) +3272 train 7.057082 (lr=1.3695e-04) (hash(x)=27616773) +3273 train 6.972615 (lr=1.3692e-04) (hash(x)=25315110) +3274 train 7.021513 (lr=1.3690e-04) (hash(x)=28354645) +3275 train 6.872674 (lr=1.3688e-04) (hash(x)=25034684) +3276 train 6.930482 (lr=1.3686e-04) (hash(x)=23550342) +3277 train 7.649025 (lr=1.3684e-04) (hash(x)=28661487) +3278 train 7.169363 (lr=1.3682e-04) (hash(x)=24724622) +3279 train 7.073431 (lr=1.3680e-04) (hash(x)=26905582) +3280 train 7.185513 (lr=1.3678e-04) (hash(x)=26838818) +3281 train 6.883102 (lr=1.3676e-04) (hash(x)=23949017) +3282 train 6.400125 (lr=1.3673e-04) (hash(x)=18846300) +3283 train 6.748787 (lr=1.3671e-04) (hash(x)=21406950) +3284 train 6.592018 (lr=1.3669e-04) (hash(x)=21157696) +3285 train 6.688671 (lr=1.3667e-04) (hash(x)=21440152) +3286 train 6.843146 (lr=1.3665e-04) (hash(x)=26749182) +3287 train 7.093030 (lr=1.3663e-04) (hash(x)=29018970) +3288 train 7.051775 (lr=1.3661e-04) (hash(x)=27577517) +3289 train 6.658757 (lr=1.3659e-04) (hash(x)=19190537) +3290 train 6.690207 (lr=1.3656e-04) (hash(x)=21957991) +3291 train 6.753139 (lr=1.3654e-04) (hash(x)=20853530) +3292 train 6.634636 (lr=1.3652e-04) (hash(x)=22291731) +3293 train 6.858980 (lr=1.3650e-04) (hash(x)=23786853) +3294 train 7.008516 (lr=1.3648e-04) (hash(x)=25740147) +3295 train 7.137729 (lr=1.3646e-04) (hash(x)=24503315) +3296 train 6.853649 (lr=1.3644e-04) (hash(x)=22541728) +3297 train 7.158981 (lr=1.3642e-04) (hash(x)=27067328) +3298 train 6.812468 (lr=1.3639e-04) (hash(x)=22600715) +3299 train 6.823227 (lr=1.3637e-04) (hash(x)=23080074) +3300 val loss 6.9976 +3300 val perplexity 1094.0066 +3300 train 6.600009 (lr=1.3635e-04) (hash(x)=22097758) +3301 train 6.799124 (lr=1.3633e-04) (hash(x)=24105430) +3302 train 6.659598 (lr=1.3631e-04) (hash(x)=23343775) +3303 train 6.917558 (lr=1.3629e-04) (hash(x)=22607537) +3304 train 6.988098 (lr=1.3627e-04) (hash(x)=26501182) +3305 train 7.262174 (lr=1.3624e-04) (hash(x)=26063650) +3306 train 6.851001 (lr=1.3622e-04) (hash(x)=23486602) +3307 train 7.954233 (lr=1.3620e-04) (hash(x)=32179773) +3308 train 11.691783 (lr=1.3618e-04) (hash(x)=66155855) +3309 train 8.449422 (lr=1.3616e-04) (hash(x)=37724427) +3310 train 7.377524 (lr=1.3614e-04) (hash(x)=28861610) +3311 train 7.323872 (lr=1.3612e-04) (hash(x)=26690225) +3312 train 6.905852 (lr=1.3610e-04) (hash(x)=24136450) +3313 train 7.120859 (lr=1.3607e-04) (hash(x)=23702010) +3314 train 7.330711 (lr=1.3605e-04) (hash(x)=28761762) +3315 train 6.665617 (lr=1.3603e-04) (hash(x)=22109609) +3316 train 7.059422 (lr=1.3601e-04) (hash(x)=25168631) +3317 train 6.961937 (lr=1.3599e-04) (hash(x)=24503786) +3318 train 6.989730 (lr=1.3597e-04) (hash(x)=23698606) +3319 train 7.009965 (lr=1.3595e-04) (hash(x)=24226255) +3320 train 7.561101 (lr=1.3592e-04) (hash(x)=31110577) +3321 train 6.950149 (lr=1.3590e-04) (hash(x)=24752754) +3322 train 6.774350 (lr=1.3588e-04) (hash(x)=21135610) +3323 train 6.759627 (lr=1.3586e-04) (hash(x)=23013573) +3324 train 6.467842 (lr=1.3584e-04) (hash(x)=20289715) +3325 train 6.773947 (lr=1.3582e-04) (hash(x)=22700287) +3326 train 6.858918 (lr=1.3580e-04) (hash(x)=21320362) +3327 train 6.976583 (lr=1.3577e-04) (hash(x)=23622702) +3328 train 7.230529 (lr=1.3575e-04) (hash(x)=27435461) +3329 train 6.974157 (lr=1.3573e-04) (hash(x)=25435452) +3330 train 7.009584 (lr=1.3571e-04) (hash(x)=27952557) +3331 train 6.647436 (lr=1.3569e-04) (hash(x)=21517429) +3332 train 6.771521 (lr=1.3567e-04) (hash(x)=24288985) +3333 train 6.918591 (lr=1.3565e-04) (hash(x)=23374788) +3334 train 6.695923 (lr=1.3563e-04) (hash(x)=22042499) +3335 train 7.019725 (lr=1.3560e-04) (hash(x)=23910425) +3336 train 7.301218 (lr=1.3558e-04) (hash(x)=28118508) +3337 train 7.113372 (lr=1.3556e-04) (hash(x)=26737440) +3338 train 6.889277 (lr=1.3554e-04) (hash(x)=24472271) +3339 train 6.866661 (lr=1.3552e-04) (hash(x)=24407484) +3340 train 7.365753 (lr=1.3550e-04) (hash(x)=27908937) +3341 train 7.464420 (lr=1.3547e-04) (hash(x)=29038937) +3342 train 7.281830 (lr=1.3545e-04) (hash(x)=24802580) +3343 train 7.280717 (lr=1.3543e-04) (hash(x)=27213318) +3344 train 7.347125 (lr=1.3541e-04) (hash(x)=28693458) +3345 train 6.611223 (lr=1.3539e-04) (hash(x)=20332324) +3346 train 7.011702 (lr=1.3537e-04) (hash(x)=26726007) +3347 train 6.909769 (lr=1.3535e-04) (hash(x)=25524191) +3348 train 6.980306 (lr=1.3532e-04) (hash(x)=25553293) +3349 train 6.925434 (lr=1.3530e-04) (hash(x)=25614848) +3350 val loss 6.9953 +3350 val perplexity 1091.4888 +3350 train 7.022693 (lr=1.3528e-04) (hash(x)=25747903) +3351 train 6.996542 (lr=1.3526e-04) (hash(x)=26701577) +3352 train 6.728776 (lr=1.3524e-04) (hash(x)=21964135) +3353 train 6.859302 (lr=1.3522e-04) (hash(x)=24461007) +3354 train 6.881705 (lr=1.3520e-04) (hash(x)=25818495) +3355 train 6.739444 (lr=1.3517e-04) (hash(x)=22091266) +3356 train 6.769426 (lr=1.3515e-04) (hash(x)=24476213) +3357 train 7.106587 (lr=1.3513e-04) (hash(x)=24500423) +3358 train 6.839563 (lr=1.3511e-04) (hash(x)=21754841) +3359 train 7.201297 (lr=1.3509e-04) (hash(x)=26216794) +3360 train 6.648851 (lr=1.3507e-04) (hash(x)=24267249) +3361 train 7.008192 (lr=1.3505e-04) (hash(x)=23143515) +3362 train 6.901906 (lr=1.3502e-04) (hash(x)=24120302) +3363 train 7.083134 (lr=1.3500e-04) (hash(x)=20817340) +3364 train 7.000034 (lr=1.3498e-04) (hash(x)=22285847) +3365 train 7.305698 (lr=1.3496e-04) (hash(x)=28151597) +3366 train 7.754307 (lr=1.3494e-04) (hash(x)=31593285) +3367 train 7.367079 (lr=1.3492e-04) (hash(x)=27579623) +3368 train 6.969931 (lr=1.3489e-04) (hash(x)=24995988) +3369 train 6.662035 (lr=1.3487e-04) (hash(x)=22166810) +3370 train 6.858117 (lr=1.3485e-04) (hash(x)=23948298) +3371 train 6.791917 (lr=1.3483e-04) (hash(x)=21532187) +3372 train 6.896554 (lr=1.3481e-04) (hash(x)=23571652) +3373 train 7.254276 (lr=1.3479e-04) (hash(x)=26911513) +3374 train 7.206384 (lr=1.3476e-04) (hash(x)=24011329) +3375 train 7.414172 (lr=1.3474e-04) (hash(x)=26086198) +3376 train 6.949653 (lr=1.3472e-04) (hash(x)=22844402) +3377 train 6.874065 (lr=1.3470e-04) (hash(x)=21817762) +3378 train 6.934484 (lr=1.3468e-04) (hash(x)=23903232) +3379 train 6.903883 (lr=1.3466e-04) (hash(x)=23911729) +3380 train 6.900756 (lr=1.3464e-04) (hash(x)=24485288) +3381 train 7.082473 (lr=1.3461e-04) (hash(x)=27955492) +3382 train 6.813580 (lr=1.3459e-04) (hash(x)=25884586) +3383 train 7.007249 (lr=1.3457e-04) (hash(x)=24863441) +3384 train 7.265157 (lr=1.3455e-04) (hash(x)=22045992) +3385 train 7.407591 (lr=1.3453e-04) (hash(x)=29174796) +3386 train 7.711259 (lr=1.3451e-04) (hash(x)=32589942) +3387 train 7.334129 (lr=1.3448e-04) (hash(x)=28856978) +3388 train 6.741721 (lr=1.3446e-04) (hash(x)=21667904) +3389 train 6.756139 (lr=1.3444e-04) (hash(x)=23431801) +3390 train 6.556397 (lr=1.3442e-04) (hash(x)=20877285) +3391 train 6.820555 (lr=1.3440e-04) (hash(x)=25236385) +3392 train 7.093338 (lr=1.3438e-04) (hash(x)=25373071) +3393 train 7.222187 (lr=1.3435e-04) (hash(x)=25713464) +3394 train 7.147217 (lr=1.3433e-04) (hash(x)=25713475) +3395 train 7.010877 (lr=1.3431e-04) (hash(x)=24278687) +3396 train 7.136163 (lr=1.3429e-04) (hash(x)=27491349) +3397 train 7.020214 (lr=1.3427e-04) (hash(x)=24513692) +3398 train 7.130429 (lr=1.3425e-04) (hash(x)=26853415) +3399 train 7.192997 (lr=1.3422e-04) (hash(x)=25330803) +3400 val loss 6.9983 +3400 val perplexity 1094.8165 +3400 train 7.167897 (lr=1.3420e-04) (hash(x)=26578066) +3401 train 7.185939 (lr=1.3418e-04) (hash(x)=26811522) +3402 train 6.940518 (lr=1.3416e-04) (hash(x)=25611092) +3403 train 6.764583 (lr=1.3414e-04) (hash(x)=21568545) +3404 train 6.746807 (lr=1.3412e-04) (hash(x)=22756484) +3405 train 6.964372 (lr=1.3409e-04) (hash(x)=27927608) +3406 train 7.015483 (lr=1.3407e-04) (hash(x)=27497018) +3407 train 6.840282 (lr=1.3405e-04) (hash(x)=22508532) +3408 train 7.272917 (lr=1.3403e-04) (hash(x)=26673287) +3409 train 6.898431 (lr=1.3401e-04) (hash(x)=23675869) +3410 train 6.875780 (lr=1.3399e-04) (hash(x)=25496948) +3411 train 6.834123 (lr=1.3396e-04) (hash(x)=24850662) +3412 train 7.109216 (lr=1.3394e-04) (hash(x)=29790167) +3413 train 6.764361 (lr=1.3392e-04) (hash(x)=24193434) +3414 train 7.154913 (lr=1.3390e-04) (hash(x)=25310919) +3415 train 6.750829 (lr=1.3388e-04) (hash(x)=21799261) +3416 train 7.065254 (lr=1.3386e-04) (hash(x)=26620074) +3417 train 6.997636 (lr=1.3383e-04) (hash(x)=26719309) +3418 train 7.326285 (lr=1.3381e-04) (hash(x)=23190530) +3419 train 6.944620 (lr=1.3379e-04) (hash(x)=24884891) +3420 train 6.967049 (lr=1.3377e-04) (hash(x)=25545849) +3421 train 6.942304 (lr=1.3375e-04) (hash(x)=26021405) +3422 train 6.879812 (lr=1.3372e-04) (hash(x)=23887343) +3423 train 6.967824 (lr=1.3370e-04) (hash(x)=26311168) +3424 train 6.634823 (lr=1.3368e-04) (hash(x)=21051541) +3425 train 7.041477 (lr=1.3366e-04) (hash(x)=23553179) +3426 train 6.896002 (lr=1.3364e-04) (hash(x)=24345540) +3427 train 7.363275 (lr=1.3362e-04) (hash(x)=27549895) +3428 train 6.676736 (lr=1.3359e-04) (hash(x)=22559753) +3429 train 6.659846 (lr=1.3357e-04) (hash(x)=21647642) +3430 train 6.551833 (lr=1.3355e-04) (hash(x)=20130901) +3431 train 6.663190 (lr=1.3353e-04) (hash(x)=20977430) +3432 train 6.686951 (lr=1.3351e-04) (hash(x)=21356429) +3433 train 6.700814 (lr=1.3348e-04) (hash(x)=23494380) +3434 train 6.945981 (lr=1.3346e-04) (hash(x)=23805501) +3435 train 6.857668 (lr=1.3344e-04) (hash(x)=23448855) +3436 train 7.250634 (lr=1.3342e-04) (hash(x)=26000319) +3437 train 6.708769 (lr=1.3340e-04) (hash(x)=21760032) +3438 train 6.857580 (lr=1.3338e-04) (hash(x)=24424886) +3439 train 7.254055 (lr=1.3335e-04) (hash(x)=26941617) +3440 train 7.278296 (lr=1.3333e-04) (hash(x)=26798528) +3441 train 7.282504 (lr=1.3331e-04) (hash(x)=27464193) +3442 train 7.194459 (lr=1.3329e-04) (hash(x)=25649118) +3443 train 7.234679 (lr=1.3327e-04) (hash(x)=26953192) +3444 train 7.054183 (lr=1.3324e-04) (hash(x)=22224958) +3445 train 6.845384 (lr=1.3322e-04) (hash(x)=24044587) +3446 train 7.307870 (lr=1.3320e-04) (hash(x)=29584466) +3447 train 7.708257 (lr=1.3318e-04) (hash(x)=30008957) +3448 train 7.538831 (lr=1.3316e-04) (hash(x)=26059290) +3449 train 6.497850 (lr=1.3314e-04) (hash(x)=19733965) +3450 val loss 6.9763 +3450 val perplexity 1070.9957 +3450 train 7.019980 (lr=1.3311e-04) (hash(x)=23960200) +3451 train 7.224156 (lr=1.3309e-04) (hash(x)=27069893) +3452 train 6.849233 (lr=1.3307e-04) (hash(x)=23947772) +3453 train 6.911417 (lr=1.3305e-04) (hash(x)=22707406) +3454 train 7.093987 (lr=1.3303e-04) (hash(x)=27832550) +3455 train 6.946278 (lr=1.3300e-04) (hash(x)=27125962) +3456 train 6.831172 (lr=1.3298e-04) (hash(x)=24510254) +3457 train 6.608379 (lr=1.3296e-04) (hash(x)=23545652) +3458 train 6.721421 (lr=1.3294e-04) (hash(x)=23554751) +3459 train 6.830671 (lr=1.3292e-04) (hash(x)=23341415) +3460 train 7.013230 (lr=1.3289e-04) (hash(x)=21784583) +3461 train 6.781618 (lr=1.3287e-04) (hash(x)=22214769) +3462 train 6.865263 (lr=1.3285e-04) (hash(x)=24206922) +3463 train 6.966641 (lr=1.3283e-04) (hash(x)=25888358) +3464 train 6.780701 (lr=1.3281e-04) (hash(x)=22689666) +3465 train 6.912263 (lr=1.3279e-04) (hash(x)=24918697) +3466 train 7.176478 (lr=1.3276e-04) (hash(x)=28237214) +3467 train 7.330933 (lr=1.3274e-04) (hash(x)=26761645) +3468 train 6.970390 (lr=1.3272e-04) (hash(x)=26979307) +3469 train 6.841333 (lr=1.3270e-04) (hash(x)=23553754) +3470 train 6.991359 (lr=1.3268e-04) (hash(x)=25256849) +3471 train 6.855034 (lr=1.3265e-04) (hash(x)=21725719) +3472 train 6.960973 (lr=1.3263e-04) (hash(x)=24897801) +3473 train 6.896886 (lr=1.3261e-04) (hash(x)=26175307) +3474 train 6.680513 (lr=1.3259e-04) (hash(x)=23309218) +3475 train 6.756039 (lr=1.3257e-04) (hash(x)=25746493) +3476 train 7.090311 (lr=1.3254e-04) (hash(x)=27169613) +3477 train 6.807236 (lr=1.3252e-04) (hash(x)=22937341) +3478 train 6.918764 (lr=1.3250e-04) (hash(x)=24250636) +3479 train 6.767995 (lr=1.3248e-04) (hash(x)=21669704) +3480 train 6.732761 (lr=1.3246e-04) (hash(x)=24431839) +3481 train 6.780620 (lr=1.3243e-04) (hash(x)=22763387) +3482 train 6.780787 (lr=1.3241e-04) (hash(x)=20489446) +3483 train 6.735088 (lr=1.3239e-04) (hash(x)=21167493) +3484 train 6.734831 (lr=1.3237e-04) (hash(x)=23465087) +3485 train 6.947737 (lr=1.3235e-04) (hash(x)=26175023) +3486 train 7.033956 (lr=1.3232e-04) (hash(x)=24986207) +3487 train 6.618076 (lr=1.3230e-04) (hash(x)=23166993) +3488 train 6.927070 (lr=1.3228e-04) (hash(x)=25281216) +3489 train 6.698654 (lr=1.3226e-04) (hash(x)=21824285) +3490 train 6.738439 (lr=1.3224e-04) (hash(x)=22352750) +3491 train 7.000003 (lr=1.3221e-04) (hash(x)=23947208) +3492 train 7.042306 (lr=1.3219e-04) (hash(x)=26257363) +3493 train 6.866084 (lr=1.3217e-04) (hash(x)=25103214) +3494 train 6.947305 (lr=1.3215e-04) (hash(x)=25267583) +3495 train 7.001667 (lr=1.3213e-04) (hash(x)=26235974) +3496 train 7.223473 (lr=1.3210e-04) (hash(x)=26430769) +3497 train 7.612762 (lr=1.3208e-04) (hash(x)=28282027) +3498 train 7.399137 (lr=1.3206e-04) (hash(x)=28386462) +3499 train 7.066657 (lr=1.3204e-04) (hash(x)=29822604) +3500 val loss 6.9609 +3500 val perplexity 1054.5378 +3500 train 7.010213 (lr=1.3202e-04) (hash(x)=29225386) +3501 train 6.895373 (lr=1.3199e-04) (hash(x)=25249294) +3502 train 6.634665 (lr=1.3197e-04) (hash(x)=20020741) +3503 train 6.784894 (lr=1.3195e-04) (hash(x)=25426430) +3504 train 6.767563 (lr=1.3193e-04) (hash(x)=25720411) +3505 train 6.779306 (lr=1.3191e-04) (hash(x)=25602639) +3506 train 6.903211 (lr=1.3188e-04) (hash(x)=26724388) +3507 train 6.831116 (lr=1.3186e-04) (hash(x)=26043735) +3508 train 6.770441 (lr=1.3184e-04) (hash(x)=24955163) +3509 train 6.745351 (lr=1.3182e-04) (hash(x)=20936107) +3510 train 6.757347 (lr=1.3180e-04) (hash(x)=20317378) +3511 train 6.789766 (lr=1.3177e-04) (hash(x)=22966314) +3512 train 7.130946 (lr=1.3175e-04) (hash(x)=25870930) +3513 train 6.935658 (lr=1.3173e-04) (hash(x)=24656635) +3514 train 7.213396 (lr=1.3171e-04) (hash(x)=28576810) +3515 train 7.117644 (lr=1.3169e-04) (hash(x)=27944619) +3516 train 6.962120 (lr=1.3166e-04) (hash(x)=27421509) +3517 train 6.682872 (lr=1.3164e-04) (hash(x)=20844620) +3518 train 6.877368 (lr=1.3162e-04) (hash(x)=28569406) +3519 train 6.778484 (lr=1.3160e-04) (hash(x)=23448505) +3520 train 7.000886 (lr=1.3157e-04) (hash(x)=24852577) +3521 train 6.820371 (lr=1.3155e-04) (hash(x)=23963103) +3522 train 6.695656 (lr=1.3153e-04) (hash(x)=24816516) +3523 train 6.894044 (lr=1.3151e-04) (hash(x)=24205942) +3524 train 6.473996 (lr=1.3149e-04) (hash(x)=20988660) +3525 train 6.559101 (lr=1.3146e-04) (hash(x)=21631366) +3526 train 6.792981 (lr=1.3144e-04) (hash(x)=23499370) +3527 train 6.919757 (lr=1.3142e-04) (hash(x)=26330693) +3528 train 6.562959 (lr=1.3140e-04) (hash(x)=23937176) +3529 train 6.872957 (lr=1.3138e-04) (hash(x)=27345885) +3530 train 6.540484 (lr=1.3135e-04) (hash(x)=21104610) +3531 train 6.944436 (lr=1.3133e-04) (hash(x)=24844466) +3532 train 6.276188 (lr=1.3131e-04) (hash(x)=21055483) +3533 train 6.640216 (lr=1.3129e-04) (hash(x)=23229414) +3534 train 6.945076 (lr=1.3126e-04) (hash(x)=26676920) +3535 train 6.912792 (lr=1.3124e-04) (hash(x)=29550596) +3536 train 6.657772 (lr=1.3122e-04) (hash(x)=22231942) +3537 train 6.858272 (lr=1.3120e-04) (hash(x)=25843852) +3538 train 7.030081 (lr=1.3118e-04) (hash(x)=27110533) +3539 train 6.515546 (lr=1.3115e-04) (hash(x)=20506540) +3540 train 6.659354 (lr=1.3113e-04) (hash(x)=21599346) +3541 train 6.890414 (lr=1.3111e-04) (hash(x)=26395519) +3542 train 6.829453 (lr=1.3109e-04) (hash(x)=25892512) +3543 train 6.934930 (lr=1.3106e-04) (hash(x)=22124892) +3544 train 6.789958 (lr=1.3104e-04) (hash(x)=21882567) +3545 train 6.849266 (lr=1.3102e-04) (hash(x)=24316212) +3546 train 6.748138 (lr=1.3100e-04) (hash(x)=24296310) +3547 train 6.849428 (lr=1.3098e-04) (hash(x)=24867036) +3548 train 6.846870 (lr=1.3095e-04) (hash(x)=23351896) +3549 train 6.787235 (lr=1.3093e-04) (hash(x)=21576408) +3550 val loss 6.9414 +3550 val perplexity 1034.2147 +3550 train 6.946562 (lr=1.3091e-04) (hash(x)=26377338) +3551 train 6.757901 (lr=1.3089e-04) (hash(x)=25607640) +3552 train 7.101516 (lr=1.3087e-04) (hash(x)=27619776) +3553 train 6.600803 (lr=1.3084e-04) (hash(x)=23454533) +3554 train 6.783766 (lr=1.3082e-04) (hash(x)=22542519) +3555 train 6.838431 (lr=1.3080e-04) (hash(x)=26176930) +3556 train 6.653073 (lr=1.3078e-04) (hash(x)=22815181) +3557 train 6.675179 (lr=1.3075e-04) (hash(x)=21821757) +3558 train 6.701219 (lr=1.3073e-04) (hash(x)=23988293) +3559 train 6.615177 (lr=1.3071e-04) (hash(x)=23795894) +3560 train 6.530674 (lr=1.3069e-04) (hash(x)=22898969) +3561 train 6.536973 (lr=1.3066e-04) (hash(x)=21510825) +3562 train 6.477179 (lr=1.3064e-04) (hash(x)=22499317) +3563 train 6.486926 (lr=1.3062e-04) (hash(x)=23756298) +3564 train 6.537212 (lr=1.3060e-04) (hash(x)=23964512) +3565 train 6.671792 (lr=1.3058e-04) (hash(x)=23262803) +3566 train 6.872067 (lr=1.3055e-04) (hash(x)=23347279) +3567 train 6.780126 (lr=1.3053e-04) (hash(x)=24165449) +3568 train 6.921657 (lr=1.3051e-04) (hash(x)=25503946) +3569 train 6.851115 (lr=1.3049e-04) (hash(x)=26532839) +3570 train 6.537634 (lr=1.3046e-04) (hash(x)=21889816) +3571 train 6.793571 (lr=1.3044e-04) (hash(x)=26643739) +3572 train 7.010816 (lr=1.3042e-04) (hash(x)=26826130) +3573 train 7.024525 (lr=1.3040e-04) (hash(x)=25810624) +3574 train 6.915213 (lr=1.3038e-04) (hash(x)=23080331) +3575 train 7.037751 (lr=1.3035e-04) (hash(x)=24697756) +3576 train 6.913372 (lr=1.3033e-04) (hash(x)=25158900) +3577 train 7.028075 (lr=1.3031e-04) (hash(x)=25793633) +3578 train 6.581616 (lr=1.3029e-04) (hash(x)=21468493) +3579 train 6.917076 (lr=1.3026e-04) (hash(x)=24431101) +3580 train 6.759183 (lr=1.3024e-04) (hash(x)=27314357) +3581 train 7.025686 (lr=1.3022e-04) (hash(x)=26286249) +3582 train 7.250736 (lr=1.3020e-04) (hash(x)=25954856) +3583 train 7.120753 (lr=1.3017e-04) (hash(x)=27218899) +3584 train 6.896631 (lr=1.3015e-04) (hash(x)=24249114) +3585 train 6.770279 (lr=1.3013e-04) (hash(x)=23659934) +3586 train 6.776763 (lr=1.3011e-04) (hash(x)=25995600) +3587 train 6.722219 (lr=1.3009e-04) (hash(x)=29462219) +3588 train 6.847783 (lr=1.3006e-04) (hash(x)=23346714) +3589 train 6.962747 (lr=1.3004e-04) (hash(x)=27168432) +3590 train 6.782134 (lr=1.3002e-04) (hash(x)=23954240) +3591 train 6.760689 (lr=1.3000e-04) (hash(x)=24748522) +3592 train 6.934822 (lr=1.2997e-04) (hash(x)=24887007) +3593 train 6.708878 (lr=1.2995e-04) (hash(x)=25539383) +3594 train 6.608147 (lr=1.2993e-04) (hash(x)=20104613) +3595 train 7.195297 (lr=1.2991e-04) (hash(x)=24843486) +3596 train 7.186061 (lr=1.2988e-04) (hash(x)=24357864) +3597 train 6.852677 (lr=1.2986e-04) (hash(x)=23873745) +3598 train 6.978594 (lr=1.2984e-04) (hash(x)=25142829) +3599 train 7.024830 (lr=1.2982e-04) (hash(x)=24965317) +3600 val loss 6.9331 +3600 val perplexity 1025.6581 +3600 train 6.530768 (lr=1.2979e-04) (hash(x)=18505205) +3601 train 6.543206 (lr=1.2977e-04) (hash(x)=23632877) +3602 train 6.801306 (lr=1.2975e-04) (hash(x)=23704554) +3603 train 6.970020 (lr=1.2973e-04) (hash(x)=26584754) +3604 train 6.588559 (lr=1.2970e-04) (hash(x)=20667709) +3605 train 6.438791 (lr=1.2968e-04) (hash(x)=20573248) +3606 train 6.575664 (lr=1.2966e-04) (hash(x)=23998997) +3607 train 6.786308 (lr=1.2964e-04) (hash(x)=22031210) +3608 train 6.812028 (lr=1.2962e-04) (hash(x)=24124536) +3609 train 6.759367 (lr=1.2959e-04) (hash(x)=22650144) +3610 train 6.820914 (lr=1.2957e-04) (hash(x)=23796998) +3611 train 6.866444 (lr=1.2955e-04) (hash(x)=24860582) +3612 train 6.364896 (lr=1.2953e-04) (hash(x)=20591300) +3613 train 6.803270 (lr=1.2950e-04) (hash(x)=23447130) +3614 train 6.823944 (lr=1.2948e-04) (hash(x)=26237963) +3615 train 6.942628 (lr=1.2946e-04) (hash(x)=25877990) +3616 train 6.704161 (lr=1.2944e-04) (hash(x)=24808003) +3617 train 6.902978 (lr=1.2941e-04) (hash(x)=24103543) +3618 train 6.844274 (lr=1.2939e-04) (hash(x)=24877184) +3619 train 6.896917 (lr=1.2937e-04) (hash(x)=24970646) +3620 train 6.865775 (lr=1.2935e-04) (hash(x)=25764524) +3621 train 7.046545 (lr=1.2932e-04) (hash(x)=25313591) +3622 train 6.875549 (lr=1.2930e-04) (hash(x)=23260940) +3623 train 6.799875 (lr=1.2928e-04) (hash(x)=24382381) +3624 train 6.746906 (lr=1.2926e-04) (hash(x)=24618902) +3625 train 6.899644 (lr=1.2923e-04) (hash(x)=25074871) +3626 train 6.642292 (lr=1.2921e-04) (hash(x)=24472251) +3627 train 6.813727 (lr=1.2919e-04) (hash(x)=25221746) +3628 train 6.916043 (lr=1.2917e-04) (hash(x)=27448790) +3629 train 6.846650 (lr=1.2914e-04) (hash(x)=25221431) +3630 train 6.380847 (lr=1.2912e-04) (hash(x)=22034366) +3631 train 6.981751 (lr=1.2910e-04) (hash(x)=24551999) +3632 train 6.669002 (lr=1.2908e-04) (hash(x)=24330217) +3633 train 6.809836 (lr=1.2905e-04) (hash(x)=22792380) +3634 train 6.570020 (lr=1.2903e-04) (hash(x)=22393767) +3635 train 6.926546 (lr=1.2901e-04) (hash(x)=28151378) +3636 train 6.944542 (lr=1.2899e-04) (hash(x)=26999341) +3637 train 6.932378 (lr=1.2896e-04) (hash(x)=27251870) +3638 train 6.868120 (lr=1.2894e-04) (hash(x)=23439462) +3639 train 6.940967 (lr=1.2892e-04) (hash(x)=25765516) +3640 train 6.869924 (lr=1.2890e-04) (hash(x)=24720171) +3641 train 7.080144 (lr=1.2887e-04) (hash(x)=23927187) +3642 train 6.840927 (lr=1.2885e-04) (hash(x)=23879561) +3643 train 6.944922 (lr=1.2883e-04) (hash(x)=25630696) +3644 train 6.503911 (lr=1.2881e-04) (hash(x)=22030016) +3645 train 6.970154 (lr=1.2878e-04) (hash(x)=28781600) +3646 train 6.997999 (lr=1.2876e-04) (hash(x)=26668019) +3647 train 7.069182 (lr=1.2874e-04) (hash(x)=25204247) +3648 train 7.277089 (lr=1.2872e-04) (hash(x)=31261394) +3649 train 7.071196 (lr=1.2869e-04) (hash(x)=26193103) +3650 val loss 6.9575 +3650 val perplexity 1051.0057 +3650 train 6.888711 (lr=1.2867e-04) (hash(x)=23872456) +3651 train 6.771593 (lr=1.2865e-04) (hash(x)=26326447) +3652 train 6.759810 (lr=1.2863e-04) (hash(x)=26449631) +3653 train 7.092484 (lr=1.2860e-04) (hash(x)=26373461) +3654 train 6.889381 (lr=1.2858e-04) (hash(x)=24882768) +3655 train 6.987625 (lr=1.2856e-04) (hash(x)=26321813) +3656 train 7.017995 (lr=1.2854e-04) (hash(x)=27056428) +3657 train 6.966999 (lr=1.2851e-04) (hash(x)=24583976) +3658 train 6.677335 (lr=1.2849e-04) (hash(x)=22259624) +3659 train 6.814416 (lr=1.2847e-04) (hash(x)=25400396) +3660 train 6.683164 (lr=1.2845e-04) (hash(x)=21095507) +3661 train 6.928586 (lr=1.2842e-04) (hash(x)=27231042) +3662 train 6.758564 (lr=1.2840e-04) (hash(x)=27292771) +3663 train 7.087497 (lr=1.2838e-04) (hash(x)=25528323) +3664 train 6.857697 (lr=1.2836e-04) (hash(x)=24374502) +3665 train 6.683760 (lr=1.2833e-04) (hash(x)=22463800) +3666 train 6.979941 (lr=1.2831e-04) (hash(x)=25413960) +3667 train 6.892137 (lr=1.2829e-04) (hash(x)=24035353) +3668 train 6.801030 (lr=1.2826e-04) (hash(x)=24815852) +3669 train 6.705039 (lr=1.2824e-04) (hash(x)=22995856) +3670 train 6.967885 (lr=1.2822e-04) (hash(x)=28128238) +3671 train 6.981964 (lr=1.2820e-04) (hash(x)=25114729) +3672 train 6.704354 (lr=1.2817e-04) (hash(x)=19337726) +3673 train 7.146616 (lr=1.2815e-04) (hash(x)=26674420) +3674 train 6.620992 (lr=1.2813e-04) (hash(x)=22553270) +3675 train 6.464500 (lr=1.2811e-04) (hash(x)=21634962) +3676 train 6.685344 (lr=1.2808e-04) (hash(x)=23362669) +3677 train 6.883733 (lr=1.2806e-04) (hash(x)=24781824) +3678 train 6.361870 (lr=1.2804e-04) (hash(x)=17909688) +3679 train 7.551361 (lr=1.2802e-04) (hash(x)=31341964) +3680 train 7.104024 (lr=1.2799e-04) (hash(x)=29071335) +3681 train 6.550704 (lr=1.2797e-04) (hash(x)=19486640) +3682 train 6.749702 (lr=1.2795e-04) (hash(x)=24301133) +3683 train 6.903809 (lr=1.2793e-04) (hash(x)=29172813) +3684 train 7.462833 (lr=1.2790e-04) (hash(x)=31501337) +3685 train 7.063069 (lr=1.2788e-04) (hash(x)=27377840) +3686 train 6.847644 (lr=1.2786e-04) (hash(x)=24499761) +3687 train 6.842557 (lr=1.2783e-04) (hash(x)=26326024) +3688 train 6.789429 (lr=1.2781e-04) (hash(x)=23179996) +3689 train 6.443737 (lr=1.2779e-04) (hash(x)=20963675) +3690 train 6.759531 (lr=1.2777e-04) (hash(x)=26650521) +3691 train 6.500687 (lr=1.2774e-04) (hash(x)=20140071) +3692 train 6.496011 (lr=1.2772e-04) (hash(x)=21734340) +3693 train 6.829550 (lr=1.2770e-04) (hash(x)=23848422) +3694 train 6.870893 (lr=1.2768e-04) (hash(x)=27499953) +3695 train 7.096891 (lr=1.2765e-04) (hash(x)=27273311) +3696 train 7.024601 (lr=1.2763e-04) (hash(x)=25741091) +3697 train 6.702805 (lr=1.2761e-04) (hash(x)=22010794) +3698 train 6.838637 (lr=1.2759e-04) (hash(x)=24616138) +3699 train 7.229499 (lr=1.2756e-04) (hash(x)=31276487) +3700 val loss 6.9485 +3700 val perplexity 1041.6072 +3700 train 6.898679 (lr=1.2754e-04) (hash(x)=24042922) +3701 train 6.667500 (lr=1.2752e-04) (hash(x)=21985431) +3702 train 6.539708 (lr=1.2749e-04) (hash(x)=21336316) +3703 train 6.365979 (lr=1.2747e-04) (hash(x)=17819313) +3704 train 7.000166 (lr=1.2745e-04) (hash(x)=27033851) +3705 train 7.066230 (lr=1.2743e-04) (hash(x)=27260043) +3706 train 7.123216 (lr=1.2740e-04) (hash(x)=26847649) +3707 train 7.035142 (lr=1.2738e-04) (hash(x)=25843618) +3708 train 7.023154 (lr=1.2736e-04) (hash(x)=25828009) +3709 train 7.042207 (lr=1.2734e-04) (hash(x)=24960960) +3710 train 7.150642 (lr=1.2731e-04) (hash(x)=24852741) +3711 train 6.621271 (lr=1.2729e-04) (hash(x)=23769243) +3712 train 6.821214 (lr=1.2727e-04) (hash(x)=27110690) +3713 train 6.859556 (lr=1.2724e-04) (hash(x)=22817285) +3714 train 6.491318 (lr=1.2722e-04) (hash(x)=19618355) +3715 train 7.108918 (lr=1.2720e-04) (hash(x)=28731298) +3716 train 6.843507 (lr=1.2718e-04) (hash(x)=23091196) +3717 train 7.378790 (lr=1.2715e-04) (hash(x)=28825233) +3718 train 6.913315 (lr=1.2713e-04) (hash(x)=25778506) +3719 train 6.855517 (lr=1.2711e-04) (hash(x)=23788738) +3720 train 6.159176 (lr=1.2708e-04) (hash(x)=16684794) +3721 train 6.716537 (lr=1.2706e-04) (hash(x)=24755102) +3722 train 7.003185 (lr=1.2704e-04) (hash(x)=26839238) +3723 train 7.032323 (lr=1.2702e-04) (hash(x)=26599031) +3724 train 6.880853 (lr=1.2699e-04) (hash(x)=25945650) +3725 train 7.053838 (lr=1.2697e-04) (hash(x)=27434751) +3726 train 6.822168 (lr=1.2695e-04) (hash(x)=24814591) +3727 train 6.751277 (lr=1.2693e-04) (hash(x)=24818744) +3728 train 6.857151 (lr=1.2690e-04) (hash(x)=25649817) +3729 train 6.763166 (lr=1.2688e-04) (hash(x)=24987021) +3730 train 6.740072 (lr=1.2686e-04) (hash(x)=24667779) +3731 train 6.729906 (lr=1.2683e-04) (hash(x)=23053871) +3732 train 6.367654 (lr=1.2681e-04) (hash(x)=19264856) +3733 train 7.006622 (lr=1.2679e-04) (hash(x)=23718117) +3734 train 6.694061 (lr=1.2677e-04) (hash(x)=21904779) +3735 train 6.898012 (lr=1.2674e-04) (hash(x)=23472795) +3736 train 7.112982 (lr=1.2672e-04) (hash(x)=24650440) +3737 train 7.146305 (lr=1.2670e-04) (hash(x)=25243911) +3738 train 7.554223 (lr=1.2667e-04) (hash(x)=30423616) +3739 train 7.545901 (lr=1.2665e-04) (hash(x)=29748225) +3740 train 7.000217 (lr=1.2663e-04) (hash(x)=25180684) +3741 train 6.971852 (lr=1.2661e-04) (hash(x)=25619065) +3742 train 7.296751 (lr=1.2658e-04) (hash(x)=31847002) +3743 train 6.876470 (lr=1.2656e-04) (hash(x)=24991832) +3744 train 6.820168 (lr=1.2654e-04) (hash(x)=23836263) +3745 train 6.720180 (lr=1.2651e-04) (hash(x)=24651902) +3746 train 7.283158 (lr=1.2649e-04) (hash(x)=22936538) +3747 train 7.239089 (lr=1.2647e-04) (hash(x)=23681545) +3748 train 6.646680 (lr=1.2645e-04) (hash(x)=21140825) +3749 train 6.814262 (lr=1.2642e-04) (hash(x)=24932453) +3750 val loss 6.9204 +3750 val perplexity 1012.7039 +3750 train 7.012283 (lr=1.2640e-04) (hash(x)=25919062) +3751 train 6.801523 (lr=1.2638e-04) (hash(x)=22424066) +3752 train 6.851096 (lr=1.2635e-04) (hash(x)=23542210) +3753 train 6.721667 (lr=1.2633e-04) (hash(x)=22113561) +3754 train 6.647913 (lr=1.2631e-04) (hash(x)=24892794) +3755 train 7.132595 (lr=1.2629e-04) (hash(x)=25262748) +3756 train 6.878116 (lr=1.2626e-04) (hash(x)=24477975) +3757 train 6.679142 (lr=1.2624e-04) (hash(x)=24681189) +3758 train 6.726888 (lr=1.2622e-04) (hash(x)=24052603) +3759 train 6.929821 (lr=1.2619e-04) (hash(x)=26474878) +3760 train 7.496999 (lr=1.2617e-04) (hash(x)=28228836) +3761 train 7.048479 (lr=1.2615e-04) (hash(x)=23832522) +3762 train 6.994243 (lr=1.2613e-04) (hash(x)=24416789) +3763 train 6.723751 (lr=1.2610e-04) (hash(x)=23930593) +3764 train 6.786855 (lr=1.2608e-04) (hash(x)=23895092) +3765 train 6.727199 (lr=1.2606e-04) (hash(x)=26865287) +3766 train 6.770018 (lr=1.2603e-04) (hash(x)=21330722) +3767 train 6.838459 (lr=1.2601e-04) (hash(x)=22704349) +3768 train 6.987274 (lr=1.2599e-04) (hash(x)=27740886) +3769 train 6.980076 (lr=1.2597e-04) (hash(x)=24935936) +3770 train 6.844869 (lr=1.2594e-04) (hash(x)=23497487) +3771 train 7.052368 (lr=1.2592e-04) (hash(x)=24801048) +3772 train 6.809330 (lr=1.2590e-04) (hash(x)=25490486) +3773 train 6.806189 (lr=1.2587e-04) (hash(x)=21166466) +3774 train 6.992953 (lr=1.2585e-04) (hash(x)=23225244) +3775 train 6.779209 (lr=1.2583e-04) (hash(x)=22293673) +3776 train 7.121315 (lr=1.2581e-04) (hash(x)=25700016) +3777 train 6.606519 (lr=1.2578e-04) (hash(x)=22370207) +3778 train 6.947371 (lr=1.2576e-04) (hash(x)=25224849) +3779 train 6.838582 (lr=1.2574e-04) (hash(x)=23311934) +3780 train 6.581562 (lr=1.2571e-04) (hash(x)=19627124) +3781 train 7.108037 (lr=1.2569e-04) (hash(x)=27132838) +3782 train 7.075656 (lr=1.2567e-04) (hash(x)=27242104) +3783 train 6.538818 (lr=1.2564e-04) (hash(x)=21785487) +3784 train 6.902679 (lr=1.2562e-04) (hash(x)=25798262) +3785 train 6.775481 (lr=1.2560e-04) (hash(x)=24806937) +3786 train 6.632065 (lr=1.2558e-04) (hash(x)=24098756) +3787 train 6.593663 (lr=1.2555e-04) (hash(x)=22981456) +3788 train 7.082569 (lr=1.2553e-04) (hash(x)=22441908) +3789 train 6.963519 (lr=1.2551e-04) (hash(x)=25867804) +3790 train 6.881213 (lr=1.2548e-04) (hash(x)=22835586) +3791 train 7.092804 (lr=1.2546e-04) (hash(x)=25251063) +3792 train 6.931432 (lr=1.2544e-04) (hash(x)=27059729) +3793 train 6.885393 (lr=1.2542e-04) (hash(x)=23819311) +3794 train 6.570916 (lr=1.2539e-04) (hash(x)=21345757) +3795 train 6.815817 (lr=1.2537e-04) (hash(x)=25796422) +3796 train 6.497163 (lr=1.2535e-04) (hash(x)=21414971) +3797 train 6.796408 (lr=1.2532e-04) (hash(x)=26120920) +3798 train 6.764698 (lr=1.2530e-04) (hash(x)=22008247) +3799 train 6.844535 (lr=1.2528e-04) (hash(x)=22722211) +3800 val loss 6.9279 +3800 val perplexity 1020.3046 +3800 train 6.554695 (lr=1.2525e-04) (hash(x)=24484513) +3801 train 6.954820 (lr=1.2523e-04) (hash(x)=24463866) +3802 train 6.963861 (lr=1.2521e-04) (hash(x)=26470775) +3803 train 6.936246 (lr=1.2519e-04) (hash(x)=24296755) +3804 train 6.925880 (lr=1.2516e-04) (hash(x)=24381309) +3805 train 7.133101 (lr=1.2514e-04) (hash(x)=26781262) +3806 train 6.624533 (lr=1.2512e-04) (hash(x)=23563137) +3807 train 6.842873 (lr=1.2509e-04) (hash(x)=24522269) +3808 train 6.624593 (lr=1.2507e-04) (hash(x)=22871995) +3809 train 6.971261 (lr=1.2505e-04) (hash(x)=24751946) +3810 train 6.778997 (lr=1.2502e-04) (hash(x)=19879741) +3811 train 6.855810 (lr=1.2500e-04) (hash(x)=25617184) +3812 train 6.509169 (lr=1.2498e-04) (hash(x)=21776722) +3813 train 6.665822 (lr=1.2495e-04) (hash(x)=22663402) +3814 train 6.997835 (lr=1.2493e-04) (hash(x)=26072046) +3815 train 6.675586 (lr=1.2491e-04) (hash(x)=23329475) +3816 train 6.762662 (lr=1.2489e-04) (hash(x)=25519031) +3817 train 6.692060 (lr=1.2486e-04) (hash(x)=22846270) +3818 train 6.752923 (lr=1.2484e-04) (hash(x)=20299429) +3819 train 7.182949 (lr=1.2482e-04) (hash(x)=30652062) +3820 train 6.484005 (lr=1.2479e-04) (hash(x)=19824665) +3821 train 7.093946 (lr=1.2477e-04) (hash(x)=26698904) +3822 train 6.891267 (lr=1.2475e-04) (hash(x)=27612163) +3823 train 6.661027 (lr=1.2472e-04) (hash(x)=24735165) +3824 train 6.428437 (lr=1.2470e-04) (hash(x)=19965890) +3825 train 6.570422 (lr=1.2468e-04) (hash(x)=23518594) +3826 train 6.646640 (lr=1.2466e-04) (hash(x)=22388460) +3827 train 6.675674 (lr=1.2463e-04) (hash(x)=23795686) +3828 train 6.570833 (lr=1.2461e-04) (hash(x)=24470150) +3829 train 6.245211 (lr=1.2459e-04) (hash(x)=19483392) +3830 train 6.699922 (lr=1.2456e-04) (hash(x)=23304516) +3831 train 7.040700 (lr=1.2454e-04) (hash(x)=27002892) +3832 train 6.780934 (lr=1.2452e-04) (hash(x)=22114813) +3833 train 6.879292 (lr=1.2449e-04) (hash(x)=26221916) +3834 train 6.384672 (lr=1.2447e-04) (hash(x)=27261960) +3835 train 6.745900 (lr=1.2445e-04) (hash(x)=21189101) +3836 train 6.416786 (lr=1.2442e-04) (hash(x)=20638173) +3837 train 6.856290 (lr=1.2440e-04) (hash(x)=25497439) +3838 train 6.321103 (lr=1.2438e-04) (hash(x)=20460499) +3839 train 6.778675 (lr=1.2435e-04) (hash(x)=23499349) +3840 train 7.644760 (lr=1.2433e-04) (hash(x)=22671939) +3841 train 7.646671 (lr=1.2431e-04) (hash(x)=26809295) +3842 train 6.829975 (lr=1.2429e-04) (hash(x)=28094504) +3843 train 6.825185 (lr=1.2426e-04) (hash(x)=26807896) +3844 train 6.907653 (lr=1.2424e-04) (hash(x)=24749334) +3845 train 6.832084 (lr=1.2422e-04) (hash(x)=25031330) +3846 train 6.716120 (lr=1.2419e-04) (hash(x)=23008126) +3847 train 6.720009 (lr=1.2417e-04) (hash(x)=22461589) +3848 train 7.020515 (lr=1.2415e-04) (hash(x)=24959391) +3849 train 6.870380 (lr=1.2412e-04) (hash(x)=24239512) +3850 val loss 6.9194 +3850 val perplexity 1011.7255 +3850 train 6.691668 (lr=1.2410e-04) (hash(x)=24760422) +3851 train 7.210217 (lr=1.2408e-04) (hash(x)=26904123) +3852 train 6.352558 (lr=1.2405e-04) (hash(x)=17986444) +3853 train 6.688438 (lr=1.2403e-04) (hash(x)=21618533) +3854 train 6.741390 (lr=1.2401e-04) (hash(x)=27107027) +3855 train 7.033836 (lr=1.2398e-04) (hash(x)=26415040) +3856 train 7.542926 (lr=1.2396e-04) (hash(x)=28682703) +3857 train 6.746352 (lr=1.2394e-04) (hash(x)=22824767) +3858 train 6.849821 (lr=1.2392e-04) (hash(x)=24540450) +3859 train 6.852625 (lr=1.2389e-04) (hash(x)=24463181) +3860 train 6.761381 (lr=1.2387e-04) (hash(x)=22832558) +3861 train 6.999127 (lr=1.2385e-04) (hash(x)=26582384) +3862 train 7.647514 (lr=1.2382e-04) (hash(x)=32327364) +3863 train 6.995851 (lr=1.2380e-04) (hash(x)=26349465) +3864 train 6.719748 (lr=1.2378e-04) (hash(x)=23079414) +3865 train 6.746405 (lr=1.2375e-04) (hash(x)=23464639) +3866 train 6.610013 (lr=1.2373e-04) (hash(x)=21406620) +3867 train 6.424170 (lr=1.2371e-04) (hash(x)=21205988) +3868 train 6.512635 (lr=1.2368e-04) (hash(x)=22742634) +3869 train 6.520880 (lr=1.2366e-04) (hash(x)=24868938) +3870 train 6.943584 (lr=1.2364e-04) (hash(x)=28095283) +3871 train 6.654041 (lr=1.2361e-04) (hash(x)=21596677) +3872 train 6.909078 (lr=1.2359e-04) (hash(x)=26884381) +3873 train 6.965906 (lr=1.2357e-04) (hash(x)=26410272) +3874 train 6.741126 (lr=1.2354e-04) (hash(x)=22915785) +3875 train 6.757624 (lr=1.2352e-04) (hash(x)=23575666) +3876 train 6.673447 (lr=1.2350e-04) (hash(x)=25313223) +3877 train 6.182974 (lr=1.2347e-04) (hash(x)=16319719) +3878 train 6.811484 (lr=1.2345e-04) (hash(x)=23227579) +3879 train 6.705326 (lr=1.2343e-04) (hash(x)=24117012) +3880 train 6.788818 (lr=1.2340e-04) (hash(x)=24681517) +3881 train 6.729778 (lr=1.2338e-04) (hash(x)=23186527) +3882 train 6.690475 (lr=1.2336e-04) (hash(x)=23472784) +3883 train 6.679101 (lr=1.2334e-04) (hash(x)=26013014) +3884 train 6.902173 (lr=1.2331e-04) (hash(x)=25952206) +3885 train 7.056989 (lr=1.2329e-04) (hash(x)=23897834) +3886 train 6.791304 (lr=1.2327e-04) (hash(x)=26350364) +3887 train 6.831531 (lr=1.2324e-04) (hash(x)=24105761) +3888 train 6.935683 (lr=1.2322e-04) (hash(x)=22801707) +3889 train 6.736090 (lr=1.2320e-04) (hash(x)=21821937) +3890 train 6.642774 (lr=1.2317e-04) (hash(x)=24264640) +3891 train 6.597213 (lr=1.2315e-04) (hash(x)=20369133) +3892 train 6.619815 (lr=1.2313e-04) (hash(x)=24313506) +3893 train 6.608972 (lr=1.2310e-04) (hash(x)=22104086) +3894 train 6.836118 (lr=1.2308e-04) (hash(x)=25312602) +3895 train 6.889841 (lr=1.2306e-04) (hash(x)=25725049) +3896 train 6.716225 (lr=1.2303e-04) (hash(x)=22981231) +3897 train 6.572423 (lr=1.2301e-04) (hash(x)=18021467) +3898 train 6.555199 (lr=1.2299e-04) (hash(x)=17960254) +3899 train 6.699306 (lr=1.2296e-04) (hash(x)=19808118) +3900 val loss 6.9151 +3900 val perplexity 1007.3306 +3900 train 6.485040 (lr=1.2294e-04) (hash(x)=21022829) +3901 train 6.657527 (lr=1.2292e-04) (hash(x)=22434663) +3902 train 6.403424 (lr=1.2289e-04) (hash(x)=20208091) +3903 train 6.517320 (lr=1.2287e-04) (hash(x)=22892776) +3904 train 6.628226 (lr=1.2285e-04) (hash(x)=21554367) +3905 train 6.769382 (lr=1.2282e-04) (hash(x)=23704875) +3906 train 6.697723 (lr=1.2280e-04) (hash(x)=21690340) +3907 train 6.688629 (lr=1.2278e-04) (hash(x)=23736780) +3908 train 6.524750 (lr=1.2275e-04) (hash(x)=21060920) +3909 train 6.479326 (lr=1.2273e-04) (hash(x)=20091559) +3910 train 6.743532 (lr=1.2271e-04) (hash(x)=22147974) +3911 train 6.676486 (lr=1.2268e-04) (hash(x)=21630383) +3912 train 6.927208 (lr=1.2266e-04) (hash(x)=28339385) +3913 train 6.770096 (lr=1.2264e-04) (hash(x)=25355505) +3914 train 6.645074 (lr=1.2261e-04) (hash(x)=20843914) +3915 train 7.138208 (lr=1.2259e-04) (hash(x)=25397467) +3916 train 6.906905 (lr=1.2257e-04) (hash(x)=23587501) +3917 train 6.450665 (lr=1.2254e-04) (hash(x)=19036533) +3918 train 6.653395 (lr=1.2252e-04) (hash(x)=29749389) +3919 train 6.485448 (lr=1.2250e-04) (hash(x)=24727094) +3920 train 6.575980 (lr=1.2247e-04) (hash(x)=22723450) +3921 train 6.767517 (lr=1.2245e-04) (hash(x)=24424680) +3922 train 6.855541 (lr=1.2243e-04) (hash(x)=25817917) +3923 train 6.645864 (lr=1.2240e-04) (hash(x)=23951182) +3924 train 6.714357 (lr=1.2238e-04) (hash(x)=21177944) +3925 train 6.550487 (lr=1.2236e-04) (hash(x)=23533768) +3926 train 6.772037 (lr=1.2233e-04) (hash(x)=24263615) +3927 train 6.559465 (lr=1.2231e-04) (hash(x)=22835000) +3928 train 6.799512 (lr=1.2229e-04) (hash(x)=26076156) +3929 train 6.805534 (lr=1.2226e-04) (hash(x)=25171508) +3930 train 6.826355 (lr=1.2224e-04) (hash(x)=22021396) +3931 train 6.985444 (lr=1.2222e-04) (hash(x)=28767849) +3932 train 6.908518 (lr=1.2219e-04) (hash(x)=29497606) +3933 train 6.622125 (lr=1.2217e-04) (hash(x)=22723124) +3934 train 6.932976 (lr=1.2215e-04) (hash(x)=27106616) +3935 train 6.766390 (lr=1.2212e-04) (hash(x)=22839049) +3936 train 6.869057 (lr=1.2210e-04) (hash(x)=25101923) +3937 train 6.794312 (lr=1.2208e-04) (hash(x)=25945975) +3938 train 6.882585 (lr=1.2205e-04) (hash(x)=25382013) +3939 train 6.438648 (lr=1.2203e-04) (hash(x)=19930900) +3940 train 6.605394 (lr=1.2201e-04) (hash(x)=22202373) +3941 train 6.763996 (lr=1.2198e-04) (hash(x)=24592992) +3942 train 6.688757 (lr=1.2196e-04) (hash(x)=25002271) +3943 train 6.528769 (lr=1.2194e-04) (hash(x)=20654136) +3944 train 6.568292 (lr=1.2191e-04) (hash(x)=20061590) +3945 train 6.468310 (lr=1.2189e-04) (hash(x)=21441361) +3946 train 6.720113 (lr=1.2187e-04) (hash(x)=20055468) +3947 train 7.463836 (lr=1.2184e-04) (hash(x)=28495621) +3948 train 6.871197 (lr=1.2182e-04) (hash(x)=25959236) +3949 train 7.191345 (lr=1.2180e-04) (hash(x)=26750193) +3950 val loss 6.9113 +3950 val perplexity 1003.5430 +3950 train 6.975675 (lr=1.2177e-04) (hash(x)=25882605) +3951 train 7.079428 (lr=1.2175e-04) (hash(x)=26776000) +3952 train 6.657867 (lr=1.2173e-04) (hash(x)=24155107) +3953 train 6.753281 (lr=1.2170e-04) (hash(x)=23441845) +3954 train 6.694824 (lr=1.2168e-04) (hash(x)=22860915) +3955 train 6.494001 (lr=1.2166e-04) (hash(x)=21584429) +3956 train 6.119210 (lr=1.2163e-04) (hash(x)=16535556) +3957 train 6.196938 (lr=1.2161e-04) (hash(x)=17946180) +3958 train 6.724327 (lr=1.2159e-04) (hash(x)=25367610) +3959 train 6.591411 (lr=1.2156e-04) (hash(x)=22560658) +3960 train 6.862697 (lr=1.2154e-04) (hash(x)=23809585) +3961 train 7.130869 (lr=1.2152e-04) (hash(x)=20438213) +3962 train 7.503836 (lr=1.2149e-04) (hash(x)=30520037) +3963 train 7.102693 (lr=1.2147e-04) (hash(x)=25276565) +3964 train 6.844360 (lr=1.2144e-04) (hash(x)=26796532) +3965 train 6.609709 (lr=1.2142e-04) (hash(x)=22850475) +3966 train 7.115921 (lr=1.2140e-04) (hash(x)=25983698) +3967 train 6.986852 (lr=1.2137e-04) (hash(x)=25995933) +3968 train 7.201233 (lr=1.2135e-04) (hash(x)=25319339) +3969 train 6.819847 (lr=1.2133e-04) (hash(x)=25066892) +3970 train 7.033891 (lr=1.2130e-04) (hash(x)=26931819) +3971 train 7.046597 (lr=1.2128e-04) (hash(x)=24163910) +3972 train 6.876476 (lr=1.2126e-04) (hash(x)=25359634) +3973 train 6.702634 (lr=1.2123e-04) (hash(x)=24323444) +3974 train 6.917003 (lr=1.2121e-04) (hash(x)=26529231) +3975 train 6.926521 (lr=1.2119e-04) (hash(x)=24635394) +3976 train 7.210862 (lr=1.2116e-04) (hash(x)=24783093) +3977 train 7.321268 (lr=1.2114e-04) (hash(x)=26710509) +3978 train 6.758715 (lr=1.2112e-04) (hash(x)=25396630) +3979 train 6.661824 (lr=1.2109e-04) (hash(x)=22556381) +3980 train 6.996555 (lr=1.2107e-04) (hash(x)=26912161) +3981 train 6.516074 (lr=1.2105e-04) (hash(x)=22268078) +3982 train 7.621494 (lr=1.2102e-04) (hash(x)=30430328) +3983 train 7.219022 (lr=1.2100e-04) (hash(x)=27537228) +3984 train 6.638630 (lr=1.2098e-04) (hash(x)=24468603) +3985 train 6.946663 (lr=1.2095e-04) (hash(x)=27006663) +3986 train 7.209945 (lr=1.2093e-04) (hash(x)=27014728) +3987 train 6.603774 (lr=1.2090e-04) (hash(x)=20883633) +3988 train 6.725623 (lr=1.2088e-04) (hash(x)=23361791) +3989 train 6.870388 (lr=1.2086e-04) (hash(x)=26775925) +3990 train 7.385649 (lr=1.2083e-04) (hash(x)=30648934) +3991 train 6.930132 (lr=1.2081e-04) (hash(x)=26496730) +3992 train 6.700974 (lr=1.2079e-04) (hash(x)=25942897) +3993 train 6.718629 (lr=1.2076e-04) (hash(x)=24887111) +3994 train 6.613406 (lr=1.2074e-04) (hash(x)=22908550) +3995 train 6.318223 (lr=1.2072e-04) (hash(x)=20342150) +3996 train 6.650997 (lr=1.2069e-04) (hash(x)=22261760) +3997 train 6.708106 (lr=1.2067e-04) (hash(x)=22731641) +3998 train 6.585401 (lr=1.2065e-04) (hash(x)=20669749) +3999 train 6.569410 (lr=1.2062e-04) (hash(x)=16533310) +4000 val loss 6.9031 +4000 val perplexity 995.3992 +4000 train 6.726811 (lr=1.2060e-04) (hash(x)=23661341) +4001 train 6.725716 (lr=1.2058e-04) (hash(x)=24644301) +4002 train 6.563680 (lr=1.2055e-04) (hash(x)=22938438) +4003 train 6.654729 (lr=1.2053e-04) (hash(x)=24315862) +4004 train 6.842297 (lr=1.2051e-04) (hash(x)=25169315) +4005 train 6.839000 (lr=1.2048e-04) (hash(x)=24752796) +4006 train 6.784370 (lr=1.2046e-04) (hash(x)=23103706) +4007 train 6.893901 (lr=1.2043e-04) (hash(x)=24881176) +4008 train 6.768341 (lr=1.2041e-04) (hash(x)=23971947) +4009 train 7.027747 (lr=1.2039e-04) (hash(x)=27741054) +4010 train 7.458342 (lr=1.2036e-04) (hash(x)=30956251) +4011 train 6.826958 (lr=1.2034e-04) (hash(x)=23649686) +4012 train 6.658992 (lr=1.2032e-04) (hash(x)=23344798) +4013 train 7.320745 (lr=1.2029e-04) (hash(x)=29529498) +4014 train 6.816574 (lr=1.2027e-04) (hash(x)=24688359) +4015 train 6.806478 (lr=1.2025e-04) (hash(x)=25593613) +4016 train 6.887517 (lr=1.2022e-04) (hash(x)=25674488) +4017 train 6.367689 (lr=1.2020e-04) (hash(x)=21345346) +4018 train 6.650189 (lr=1.2018e-04) (hash(x)=21978324) +4019 train 6.687062 (lr=1.2015e-04) (hash(x)=23669244) +4020 train 6.553806 (lr=1.2013e-04) (hash(x)=22479613) +4021 train 6.551958 (lr=1.2010e-04) (hash(x)=22855256) +4022 train 7.006187 (lr=1.2008e-04) (hash(x)=19759826) +4023 train 6.871177 (lr=1.2006e-04) (hash(x)=22886646) +4024 train 6.829549 (lr=1.2003e-04) (hash(x)=25553008) +4025 train 6.718166 (lr=1.2001e-04) (hash(x)=25487028) +4026 train 7.230465 (lr=1.1999e-04) (hash(x)=26799246) +4027 train 7.564032 (lr=1.1996e-04) (hash(x)=30728540) +4028 train 6.995132 (lr=1.1994e-04) (hash(x)=23966676) +4029 train 6.651077 (lr=1.1992e-04) (hash(x)=22118783) +4030 train 6.804625 (lr=1.1989e-04) (hash(x)=24744703) +4031 train 6.810358 (lr=1.1987e-04) (hash(x)=21407676) +4032 train 6.782664 (lr=1.1985e-04) (hash(x)=20623349) +4033 train 6.557344 (lr=1.1982e-04) (hash(x)=24723788) +4034 train 6.878276 (lr=1.1980e-04) (hash(x)=25030709) +4035 train 6.912709 (lr=1.1977e-04) (hash(x)=26326164) +4036 train 6.757048 (lr=1.1975e-04) (hash(x)=23754475) +4037 train 7.444484 (lr=1.1973e-04) (hash(x)=30112933) +4038 train 7.156368 (lr=1.1970e-04) (hash(x)=27474299) +4039 train 6.599236 (lr=1.1968e-04) (hash(x)=21720304) +4040 train 7.016707 (lr=1.1966e-04) (hash(x)=25142674) +4041 train 7.253154 (lr=1.1963e-04) (hash(x)=25284552) +4042 train 7.145948 (lr=1.1961e-04) (hash(x)=24554942) +4043 train 6.882611 (lr=1.1959e-04) (hash(x)=23773870) +4044 train 6.594276 (lr=1.1956e-04) (hash(x)=23896338) +4045 train 7.450992 (lr=1.1954e-04) (hash(x)=34984911) +4046 train 6.728227 (lr=1.1951e-04) (hash(x)=23854263) +4047 train 7.010466 (lr=1.1949e-04) (hash(x)=27263416) +4048 train 6.679870 (lr=1.1947e-04) (hash(x)=24989642) +4049 train 6.720703 (lr=1.1944e-04) (hash(x)=24492055) +4050 val loss 6.8927 +4050 val perplexity 985.0892 +4050 train 6.594495 (lr=1.1942e-04) (hash(x)=21579916) +4051 train 6.872084 (lr=1.1940e-04) (hash(x)=25274710) +4052 train 6.750773 (lr=1.1937e-04) (hash(x)=24701947) +4053 train 6.720321 (lr=1.1935e-04) (hash(x)=25477340) +4054 train 6.637640 (lr=1.1933e-04) (hash(x)=23774195) +4055 train 6.931831 (lr=1.1930e-04) (hash(x)=25840801) +4056 train 7.064575 (lr=1.1928e-04) (hash(x)=27972529) +4057 train 6.858153 (lr=1.1925e-04) (hash(x)=26952458) +4058 train 6.382118 (lr=1.1923e-04) (hash(x)=22683653) +4059 train 6.418502 (lr=1.1921e-04) (hash(x)=20984129) +4060 train 6.603748 (lr=1.1918e-04) (hash(x)=22816482) +4061 train 6.903783 (lr=1.1916e-04) (hash(x)=24285302) +4062 train 7.296204 (lr=1.1914e-04) (hash(x)=31517950) +4063 train 7.489150 (lr=1.1911e-04) (hash(x)=31424568) +4064 train 7.099732 (lr=1.1909e-04) (hash(x)=29497876) +4065 train 7.084853 (lr=1.1906e-04) (hash(x)=27277376) +4066 train 6.860046 (lr=1.1904e-04) (hash(x)=26832588) +4067 train 6.681670 (lr=1.1902e-04) (hash(x)=25149712) +4068 train 6.694902 (lr=1.1899e-04) (hash(x)=23728457) +4069 train 6.556245 (lr=1.1897e-04) (hash(x)=25265136) +4070 train 7.146224 (lr=1.1895e-04) (hash(x)=25241681) +4071 train 6.844131 (lr=1.1892e-04) (hash(x)=23403065) +4072 train 6.806676 (lr=1.1890e-04) (hash(x)=25808207) +4073 train 6.721283 (lr=1.1888e-04) (hash(x)=23904844) +4074 train 6.377700 (lr=1.1885e-04) (hash(x)=18865309) +4075 train 6.839321 (lr=1.1883e-04) (hash(x)=23531744) +4076 train 6.855598 (lr=1.1880e-04) (hash(x)=25784275) +4077 train 6.602623 (lr=1.1878e-04) (hash(x)=22417529) +4078 train 6.611071 (lr=1.1876e-04) (hash(x)=23095491) +4079 train 6.740816 (lr=1.1873e-04) (hash(x)=22656033) +4080 train 6.722498 (lr=1.1871e-04) (hash(x)=25865435) +4081 train 6.861084 (lr=1.1869e-04) (hash(x)=25699377) +4082 train 6.853552 (lr=1.1866e-04) (hash(x)=20854084) +4083 train 6.403146 (lr=1.1864e-04) (hash(x)=18950799) +4084 train 6.656323 (lr=1.1861e-04) (hash(x)=22633739) +4085 train 7.299286 (lr=1.1859e-04) (hash(x)=34054446) +4086 train 7.063293 (lr=1.1857e-04) (hash(x)=27599387) +4087 train 6.880246 (lr=1.1854e-04) (hash(x)=26869295) +4088 train 6.822272 (lr=1.1852e-04) (hash(x)=24075139) +4089 train 7.267555 (lr=1.1850e-04) (hash(x)=29784110) +4090 train 7.648786 (lr=1.1847e-04) (hash(x)=34273918) +4091 train 8.107950 (lr=1.1845e-04) (hash(x)=34472685) +4092 train 7.363191 (lr=1.1842e-04) (hash(x)=30113791) +4093 train 6.594265 (lr=1.1840e-04) (hash(x)=22366381) +4094 train 6.875203 (lr=1.1838e-04) (hash(x)=24922935) +4095 train 7.028378 (lr=1.1835e-04) (hash(x)=25504151) +4096 train 6.937978 (lr=1.1833e-04) (hash(x)=24517375) +4097 train 7.712081 (lr=1.1831e-04) (hash(x)=25871651) +4098 train 6.696948 (lr=1.1828e-04) (hash(x)=23480225) +4099 train 6.546510 (lr=1.1826e-04) (hash(x)=22559978) +4100 val loss 6.8922 +4100 val perplexity 984.5486 +4100 train 7.004048 (lr=1.1823e-04) (hash(x)=25795272) +4101 train 6.947208 (lr=1.1821e-04) (hash(x)=25440399) +4102 train 6.639002 (lr=1.1819e-04) (hash(x)=21581806) +4103 train 6.662446 (lr=1.1816e-04) (hash(x)=25781518) +4104 train 6.769337 (lr=1.1814e-04) (hash(x)=24682372) +4105 train 6.618103 (lr=1.1812e-04) (hash(x)=22440094) +4106 train 6.809694 (lr=1.1809e-04) (hash(x)=23661032) +4107 train 7.010854 (lr=1.1807e-04) (hash(x)=26966012) +4108 train 7.092265 (lr=1.1804e-04) (hash(x)=26232227) +4109 train 6.725766 (lr=1.1802e-04) (hash(x)=24110656) +4110 train 7.006861 (lr=1.1800e-04) (hash(x)=25938621) +4111 train 6.831136 (lr=1.1797e-04) (hash(x)=26432850) +4112 train 6.817021 (lr=1.1795e-04) (hash(x)=25387672) +4113 train 6.554794 (lr=1.1793e-04) (hash(x)=22740017) +4114 train 6.932236 (lr=1.1790e-04) (hash(x)=26384190) +4115 train 6.634575 (lr=1.1788e-04) (hash(x)=24725583) +4116 train 6.802251 (lr=1.1785e-04) (hash(x)=23986700) +4117 train 6.758174 (lr=1.1783e-04) (hash(x)=18529900) +4118 train 6.813724 (lr=1.1781e-04) (hash(x)=22236257) +4119 train 6.415771 (lr=1.1778e-04) (hash(x)=20155894) +4120 train 6.265871 (lr=1.1776e-04) (hash(x)=17423813) +4121 train 6.199460 (lr=1.1774e-04) (hash(x)=18905183) +4122 train 6.539836 (lr=1.1771e-04) (hash(x)=22534398) +4123 train 7.271462 (lr=1.1769e-04) (hash(x)=25247868) +4124 train 6.784390 (lr=1.1766e-04) (hash(x)=23994188) +4125 train 6.681304 (lr=1.1764e-04) (hash(x)=22929754) +4126 train 6.497590 (lr=1.1762e-04) (hash(x)=22485897) +4127 train 6.599805 (lr=1.1759e-04) (hash(x)=22270169) +4128 train 6.570027 (lr=1.1757e-04) (hash(x)=23638027) +4129 train 6.891403 (lr=1.1754e-04) (hash(x)=23821210) +4130 train 6.787939 (lr=1.1752e-04) (hash(x)=25021512) +4131 train 6.821859 (lr=1.1750e-04) (hash(x)=25240141) +4132 train 6.774928 (lr=1.1747e-04) (hash(x)=22833160) +4133 train 6.709072 (lr=1.1745e-04) (hash(x)=22909944) +4134 train 7.012720 (lr=1.1743e-04) (hash(x)=26163558) +4135 train 6.688500 (lr=1.1740e-04) (hash(x)=22108461) +4136 train 6.663825 (lr=1.1738e-04) (hash(x)=22549232) +4137 train 6.861847 (lr=1.1735e-04) (hash(x)=24701302) +4138 train 6.848348 (lr=1.1733e-04) (hash(x)=25206013) +4139 train 6.905240 (lr=1.1731e-04) (hash(x)=27896130) +4140 train 6.665279 (lr=1.1728e-04) (hash(x)=24106243) +4141 train 7.310445 (lr=1.1726e-04) (hash(x)=27158651) +4142 train 6.819376 (lr=1.1723e-04) (hash(x)=23841147) +4143 train 6.682332 (lr=1.1721e-04) (hash(x)=24802848) +4144 train 7.033682 (lr=1.1719e-04) (hash(x)=24911295) +4145 train 6.858247 (lr=1.1716e-04) (hash(x)=26473900) +4146 train 6.885757 (lr=1.1714e-04) (hash(x)=26785092) +4147 train 7.162770 (lr=1.1712e-04) (hash(x)=30188532) +4148 train 6.704360 (lr=1.1709e-04) (hash(x)=25010649) +4149 train 6.680315 (lr=1.1707e-04) (hash(x)=22409016) +4150 val loss 6.8767 +4150 val perplexity 969.4200 +4150 train 7.420698 (lr=1.1704e-04) (hash(x)=31675024) +4151 train 6.719598 (lr=1.1702e-04) (hash(x)=25086604) +4152 train 6.744656 (lr=1.1700e-04) (hash(x)=24429343) +4153 train 6.903751 (lr=1.1697e-04) (hash(x)=25014232) +4154 train 6.802356 (lr=1.1695e-04) (hash(x)=25366275) +4155 train 7.281841 (lr=1.1692e-04) (hash(x)=24031473) +4156 train 6.773767 (lr=1.1690e-04) (hash(x)=26651059) +4157 train 6.895282 (lr=1.1688e-04) (hash(x)=26069721) +4158 train 7.089228 (lr=1.1685e-04) (hash(x)=28114382) +4159 train 7.074296 (lr=1.1683e-04) (hash(x)=26983186) +4160 train 6.382518 (lr=1.1681e-04) (hash(x)=21944670) +4161 train 7.147031 (lr=1.1678e-04) (hash(x)=28155702) +4162 train 6.606984 (lr=1.1676e-04) (hash(x)=24765002) +4163 train 6.835852 (lr=1.1673e-04) (hash(x)=26492636) +4164 train 6.825619 (lr=1.1671e-04) (hash(x)=24063705) +4165 train 7.127799 (lr=1.1669e-04) (hash(x)=27079573) +4166 train 6.722322 (lr=1.1666e-04) (hash(x)=24912201) +4167 train 6.864298 (lr=1.1664e-04) (hash(x)=27208507) +4168 train 6.745786 (lr=1.1661e-04) (hash(x)=25824320) +4169 train 7.331207 (lr=1.1659e-04) (hash(x)=29641677) +4170 train 7.007743 (lr=1.1657e-04) (hash(x)=26275614) +4171 train 6.846224 (lr=1.1654e-04) (hash(x)=25227725) +4172 train 6.919567 (lr=1.1652e-04) (hash(x)=27417375) +4173 train 7.131793 (lr=1.1649e-04) (hash(x)=25581973) +4174 train 7.346969 (lr=1.1647e-04) (hash(x)=30360417) +4175 train 6.676294 (lr=1.1645e-04) (hash(x)=23862845) +4176 train 6.744316 (lr=1.1642e-04) (hash(x)=25415130) +4177 train 6.763356 (lr=1.1640e-04) (hash(x)=23111123) +4178 train 6.694789 (lr=1.1637e-04) (hash(x)=24022804) +4179 train 6.739572 (lr=1.1635e-04) (hash(x)=25148490) +4180 train 6.945079 (lr=1.1633e-04) (hash(x)=22792092) +4181 train 6.973319 (lr=1.1630e-04) (hash(x)=24779698) +4182 train 6.955075 (lr=1.1628e-04) (hash(x)=24870844) +4183 train 6.610846 (lr=1.1626e-04) (hash(x)=22664494) +4184 train 6.687723 (lr=1.1623e-04) (hash(x)=22599729) +4185 train 6.896049 (lr=1.1621e-04) (hash(x)=24707078) +4186 train 6.648776 (lr=1.1618e-04) (hash(x)=23823945) +4187 train 6.343909 (lr=1.1616e-04) (hash(x)=22219856) +4188 train 7.109982 (lr=1.1614e-04) (hash(x)=27061401) +4189 train 6.779524 (lr=1.1611e-04) (hash(x)=23398766) +4190 train 6.952336 (lr=1.1609e-04) (hash(x)=27916730) +4191 train 6.792135 (lr=1.1606e-04) (hash(x)=24092927) +4192 train 6.832822 (lr=1.1604e-04) (hash(x)=24723657) +4193 train 6.835369 (lr=1.1602e-04) (hash(x)=24676155) +4194 train 6.754184 (lr=1.1599e-04) (hash(x)=23455369) +4195 train 6.671506 (lr=1.1597e-04) (hash(x)=21999890) +4196 train 6.587266 (lr=1.1594e-04) (hash(x)=23385567) +4197 train 6.826514 (lr=1.1592e-04) (hash(x)=25120814) +4198 train 6.525623 (lr=1.1590e-04) (hash(x)=21308113) +4199 train 6.865631 (lr=1.1587e-04) (hash(x)=27213812) +4200 val loss 6.8749 +4200 val perplexity 967.6314 +4200 train 6.404999 (lr=1.1585e-04) (hash(x)=19675382) +4201 train 6.707126 (lr=1.1582e-04) (hash(x)=23882161) +4202 train 6.684561 (lr=1.1580e-04) (hash(x)=24338567) +4203 train 7.003706 (lr=1.1578e-04) (hash(x)=27649723) +4204 train 6.787686 (lr=1.1575e-04) (hash(x)=27563514) +4205 train 6.776265 (lr=1.1573e-04) (hash(x)=23128552) +4206 train 6.651554 (lr=1.1570e-04) (hash(x)=26203283) +4207 train 6.735607 (lr=1.1568e-04) (hash(x)=23929955) +4208 train 6.360071 (lr=1.1566e-04) (hash(x)=20978691) +4209 train 6.709500 (lr=1.1563e-04) (hash(x)=21875178) +4210 train 6.787141 (lr=1.1561e-04) (hash(x)=23563293) +4211 train 6.884539 (lr=1.1558e-04) (hash(x)=25538503) +4212 train 7.008478 (lr=1.1556e-04) (hash(x)=24171014) +4213 train 6.813035 (lr=1.1554e-04) (hash(x)=22306665) +4214 train 6.732624 (lr=1.1551e-04) (hash(x)=26082318) +4215 train 6.473619 (lr=1.1549e-04) (hash(x)=23025790) +4216 train 6.642731 (lr=1.1546e-04) (hash(x)=21146597) +4217 train 6.993717 (lr=1.1544e-04) (hash(x)=27470230) +4218 train 6.702882 (lr=1.1542e-04) (hash(x)=22691005) +4219 train 6.527533 (lr=1.1539e-04) (hash(x)=21550313) +4220 train 6.631397 (lr=1.1537e-04) (hash(x)=20618443) +4221 train 6.713689 (lr=1.1534e-04) (hash(x)=25260787) +4222 train 6.782829 (lr=1.1532e-04) (hash(x)=25249873) +4223 train 6.353371 (lr=1.1530e-04) (hash(x)=20452272) +4224 train 6.711606 (lr=1.1527e-04) (hash(x)=25649764) +4225 train 6.562444 (lr=1.1525e-04) (hash(x)=19589460) +4226 train 6.980374 (lr=1.1522e-04) (hash(x)=26477595) +4227 train 7.187389 (lr=1.1520e-04) (hash(x)=27585442) +4228 train 6.994653 (lr=1.1518e-04) (hash(x)=25821343) +4229 train 6.896478 (lr=1.1515e-04) (hash(x)=24549919) +4230 train 6.786471 (lr=1.1513e-04) (hash(x)=26124522) +4231 train 7.133371 (lr=1.1510e-04) (hash(x)=26473464) +4232 train 7.112649 (lr=1.1508e-04) (hash(x)=28883028) +4233 train 7.039879 (lr=1.1506e-04) (hash(x)=29611296) +4234 train 6.952442 (lr=1.1503e-04) (hash(x)=29059941) +4235 train 6.776764 (lr=1.1501e-04) (hash(x)=26368203) +4236 train 6.844765 (lr=1.1498e-04) (hash(x)=27021360) +4237 train 6.719870 (lr=1.1496e-04) (hash(x)=26135379) +4238 train 6.518003 (lr=1.1494e-04) (hash(x)=25862549) +4239 train 6.929771 (lr=1.1491e-04) (hash(x)=28276603) +4240 train 6.509495 (lr=1.1489e-04) (hash(x)=22170090) +4241 train 6.854236 (lr=1.1486e-04) (hash(x)=22625589) +4242 train 6.860516 (lr=1.1484e-04) (hash(x)=25751475) +4243 train 6.791663 (lr=1.1482e-04) (hash(x)=25836838) +4244 train 6.725383 (lr=1.1479e-04) (hash(x)=23938214) +4245 train 6.659402 (lr=1.1477e-04) (hash(x)=22759365) +4246 train 6.627791 (lr=1.1474e-04) (hash(x)=24964628) +4247 train 6.301672 (lr=1.1472e-04) (hash(x)=21480367) +4248 train 6.872798 (lr=1.1470e-04) (hash(x)=25974694) +4249 train 7.227910 (lr=1.1467e-04) (hash(x)=29830546) +4250 val loss 6.8768 +4250 val perplexity 969.5370 +4250 train 6.863719 (lr=1.1465e-04) (hash(x)=26283200) +4251 train 6.965238 (lr=1.1462e-04) (hash(x)=25605672) +4252 train 6.560869 (lr=1.1460e-04) (hash(x)=21439107) +4253 train 6.496811 (lr=1.1458e-04) (hash(x)=22626883) +4254 train 6.835656 (lr=1.1455e-04) (hash(x)=25627150) +4255 train 6.993433 (lr=1.1453e-04) (hash(x)=24658642) +4256 train 7.070979 (lr=1.1450e-04) (hash(x)=29755505) +4257 train 6.913571 (lr=1.1448e-04) (hash(x)=22750846) +4258 train 6.869358 (lr=1.1446e-04) (hash(x)=21892651) +4259 train 6.923648 (lr=1.1443e-04) (hash(x)=22487960) +4260 train 6.950584 (lr=1.1441e-04) (hash(x)=24059869) +4261 train 6.697372 (lr=1.1438e-04) (hash(x)=21090180) +4262 train 6.789844 (lr=1.1436e-04) (hash(x)=22716452) +4263 train 6.967620 (lr=1.1433e-04) (hash(x)=26854801) +4264 train 6.763443 (lr=1.1431e-04) (hash(x)=23815428) +4265 train 6.581035 (lr=1.1429e-04) (hash(x)=23368704) +4266 train 6.689565 (lr=1.1426e-04) (hash(x)=24301098) +4267 train 6.937509 (lr=1.1424e-04) (hash(x)=25025039) +4268 train 6.649505 (lr=1.1421e-04) (hash(x)=25425736) +4269 train 6.868677 (lr=1.1419e-04) (hash(x)=27439380) +4270 train 6.380021 (lr=1.1417e-04) (hash(x)=18682756) +4271 train 6.521466 (lr=1.1414e-04) (hash(x)=17862226) +4272 train 7.032360 (lr=1.1412e-04) (hash(x)=29946491) +4273 train 6.357440 (lr=1.1409e-04) (hash(x)=21392062) +4274 train 6.903114 (lr=1.1407e-04) (hash(x)=25195556) +4275 train 6.879236 (lr=1.1405e-04) (hash(x)=26682036) +4276 train 6.749240 (lr=1.1402e-04) (hash(x)=21235260) +4277 train 6.583957 (lr=1.1400e-04) (hash(x)=22118984) +4278 train 6.616268 (lr=1.1397e-04) (hash(x)=24094510) +4279 train 7.134381 (lr=1.1395e-04) (hash(x)=28519182) +4280 train 6.834741 (lr=1.1393e-04) (hash(x)=26652859) +4281 train 6.711021 (lr=1.1390e-04) (hash(x)=24463139) +4282 train 6.684972 (lr=1.1388e-04) (hash(x)=23281870) +4283 train 6.911228 (lr=1.1385e-04) (hash(x)=29181174) +4284 train 6.572948 (lr=1.1383e-04) (hash(x)=24797417) +4285 train 6.953146 (lr=1.1380e-04) (hash(x)=29026537) +4286 train 6.738305 (lr=1.1378e-04) (hash(x)=23045165) +4287 train 6.683746 (lr=1.1376e-04) (hash(x)=25193694) +4288 train 6.716819 (lr=1.1373e-04) (hash(x)=23475407) +4289 train 6.855777 (lr=1.1371e-04) (hash(x)=24875410) +4290 train 6.736800 (lr=1.1368e-04) (hash(x)=26328101) +4291 train 7.077619 (lr=1.1366e-04) (hash(x)=26273661) +4292 train 6.804006 (lr=1.1364e-04) (hash(x)=23271891) +4293 train 6.751578 (lr=1.1361e-04) (hash(x)=23300732) +4294 train 6.829657 (lr=1.1359e-04) (hash(x)=24243693) +4295 train 6.900365 (lr=1.1356e-04) (hash(x)=25642620) +4296 train 6.916579 (lr=1.1354e-04) (hash(x)=27730411) +4297 train 6.690370 (lr=1.1351e-04) (hash(x)=25485335) +4298 train 6.536905 (lr=1.1349e-04) (hash(x)=25268789) +4299 train 7.002655 (lr=1.1347e-04) (hash(x)=28917143) +4300 val loss 6.8852 +4300 val perplexity 977.7373 +4300 train 7.136726 (lr=1.1344e-04) (hash(x)=28987991) +4301 train 6.870740 (lr=1.1342e-04) (hash(x)=25989151) +4302 train 6.768816 (lr=1.1339e-04) (hash(x)=25658195) +4303 train 6.759248 (lr=1.1337e-04) (hash(x)=25765909) +4304 train 6.764999 (lr=1.1335e-04) (hash(x)=25704261) +4305 train 6.781233 (lr=1.1332e-04) (hash(x)=24438198) +4306 train 6.583403 (lr=1.1330e-04) (hash(x)=22871710) +4307 train 6.429105 (lr=1.1327e-04) (hash(x)=20160896) +4308 train 6.974614 (lr=1.1325e-04) (hash(x)=24218641) +4309 train 6.403909 (lr=1.1323e-04) (hash(x)=22073751) +4310 train 6.731169 (lr=1.1320e-04) (hash(x)=26434959) +4311 train 6.464548 (lr=1.1318e-04) (hash(x)=20750531) +4312 train 6.589012 (lr=1.1315e-04) (hash(x)=22232293) +4313 train 6.860292 (lr=1.1313e-04) (hash(x)=27324521) +4314 train 6.491408 (lr=1.1310e-04) (hash(x)=22217862) +4315 train 6.951881 (lr=1.1308e-04) (hash(x)=25741958) +4316 train 6.723384 (lr=1.1306e-04) (hash(x)=22738456) +4317 train 6.778276 (lr=1.1303e-04) (hash(x)=25387302) +4318 train 6.738789 (lr=1.1301e-04) (hash(x)=24669014) +4319 train 6.859085 (lr=1.1298e-04) (hash(x)=24917098) +4320 train 6.818135 (lr=1.1296e-04) (hash(x)=26698227) +4321 train 6.600322 (lr=1.1294e-04) (hash(x)=23518293) +4322 train 6.509251 (lr=1.1291e-04) (hash(x)=23643971) +4323 train 6.719019 (lr=1.1289e-04) (hash(x)=25659505) +4324 train 6.514568 (lr=1.1286e-04) (hash(x)=22697720) +4325 train 7.024172 (lr=1.1284e-04) (hash(x)=25082178) +4326 train 6.552349 (lr=1.1281e-04) (hash(x)=24166546) +4327 train 6.706999 (lr=1.1279e-04) (hash(x)=24499766) +4328 train 6.835264 (lr=1.1277e-04) (hash(x)=24338607) +4329 train 6.620943 (lr=1.1274e-04) (hash(x)=23225420) +4330 train 6.778339 (lr=1.1272e-04) (hash(x)=25907032) +4331 train 6.578378 (lr=1.1269e-04) (hash(x)=24634979) +4332 train 6.681398 (lr=1.1267e-04) (hash(x)=22161377) +4333 train 6.855897 (lr=1.1264e-04) (hash(x)=22559939) +4334 train 6.622368 (lr=1.1262e-04) (hash(x)=20840022) +4335 train 6.887577 (lr=1.1260e-04) (hash(x)=25067358) +4336 train 6.531037 (lr=1.1257e-04) (hash(x)=23432626) +4337 train 6.700373 (lr=1.1255e-04) (hash(x)=23820385) +4338 train 7.472566 (lr=1.1252e-04) (hash(x)=31594930) +4339 train 6.873558 (lr=1.1250e-04) (hash(x)=27138750) +4340 train 7.130610 (lr=1.1248e-04) (hash(x)=30031341) +4341 train 6.660939 (lr=1.1245e-04) (hash(x)=24602807) +4342 train 6.413717 (lr=1.1243e-04) (hash(x)=21584976) +4343 train 6.867789 (lr=1.1240e-04) (hash(x)=27479796) +4344 train 6.563232 (lr=1.1238e-04) (hash(x)=22746241) +4345 train 6.723877 (lr=1.1235e-04) (hash(x)=19728452) +4346 train 6.523982 (lr=1.1233e-04) (hash(x)=24502020) +4347 train 6.990807 (lr=1.1231e-04) (hash(x)=28225954) +4348 train 6.622151 (lr=1.1228e-04) (hash(x)=23893447) +4349 train 6.995981 (lr=1.1226e-04) (hash(x)=25654586) +4350 val loss 6.8634 +4350 val perplexity 956.6223 +4350 train 6.820099 (lr=1.1223e-04) (hash(x)=23856469) +4351 train 6.722633 (lr=1.1221e-04) (hash(x)=23136080) +4352 train 6.820030 (lr=1.1218e-04) (hash(x)=26532918) +4353 train 6.752078 (lr=1.1216e-04) (hash(x)=25461947) +4354 train 6.799665 (lr=1.1214e-04) (hash(x)=26590231) +4355 train 6.502518 (lr=1.1211e-04) (hash(x)=21441985) +4356 train 6.778801 (lr=1.1209e-04) (hash(x)=26507941) +4357 train 7.106828 (lr=1.1206e-04) (hash(x)=26245238) +4358 train 6.850607 (lr=1.1204e-04) (hash(x)=24879059) +4359 train 7.113782 (lr=1.1202e-04) (hash(x)=29810074) +4360 train 6.492182 (lr=1.1199e-04) (hash(x)=24258069) +4361 train 6.637973 (lr=1.1197e-04) (hash(x)=25229360) +4362 train 6.864442 (lr=1.1194e-04) (hash(x)=25440206) +4363 train 6.736638 (lr=1.1192e-04) (hash(x)=23222125) +4364 train 6.553017 (lr=1.1189e-04) (hash(x)=23353186) +4365 train 6.798561 (lr=1.1187e-04) (hash(x)=26995240) +4366 train 6.732833 (lr=1.1185e-04) (hash(x)=24135899) +4367 train 6.737957 (lr=1.1182e-04) (hash(x)=24765539) +4368 train 6.799739 (lr=1.1180e-04) (hash(x)=26051004) +4369 train 6.569355 (lr=1.1177e-04) (hash(x)=22559142) +4370 train 6.507099 (lr=1.1175e-04) (hash(x)=20364388) +4371 train 6.975516 (lr=1.1172e-04) (hash(x)=25938817) +4372 train 6.980691 (lr=1.1170e-04) (hash(x)=26060945) +4373 train 6.928461 (lr=1.1168e-04) (hash(x)=27866714) +4374 train 6.808836 (lr=1.1165e-04) (hash(x)=27104972) +4375 train 6.516376 (lr=1.1163e-04) (hash(x)=22216309) +4376 train 6.571417 (lr=1.1160e-04) (hash(x)=20781533) +4377 train 6.482620 (lr=1.1158e-04) (hash(x)=18784350) +4378 train 6.593120 (lr=1.1155e-04) (hash(x)=21102897) +4379 train 6.849143 (lr=1.1153e-04) (hash(x)=25647489) +4380 train 6.693892 (lr=1.1151e-04) (hash(x)=24486462) +4381 train 6.940499 (lr=1.1148e-04) (hash(x)=26539114) +4382 train 6.603386 (lr=1.1146e-04) (hash(x)=20026045) +4383 train 6.923805 (lr=1.1143e-04) (hash(x)=20613861) +4384 train 6.568573 (lr=1.1141e-04) (hash(x)=20676237) +4385 train 6.799518 (lr=1.1138e-04) (hash(x)=24893163) +4386 train 6.306348 (lr=1.1136e-04) (hash(x)=17299395) +4387 train 6.482405 (lr=1.1134e-04) (hash(x)=19580191) +4388 train 6.760183 (lr=1.1131e-04) (hash(x)=25588218) +4389 train 6.838454 (lr=1.1129e-04) (hash(x)=26433063) +4390 train 6.946050 (lr=1.1126e-04) (hash(x)=24917693) +4391 train 6.603215 (lr=1.1124e-04) (hash(x)=23462447) +4392 train 6.802551 (lr=1.1121e-04) (hash(x)=27185416) +4393 train 6.979080 (lr=1.1119e-04) (hash(x)=24109010) +4394 train 6.688887 (lr=1.1117e-04) (hash(x)=21486000) +4395 train 6.569292 (lr=1.1114e-04) (hash(x)=22230006) +4396 train 7.036473 (lr=1.1112e-04) (hash(x)=26092311) +4397 train 6.728233 (lr=1.1109e-04) (hash(x)=24112426) +4398 train 6.532207 (lr=1.1107e-04) (hash(x)=21881373) +4399 train 6.661887 (lr=1.1104e-04) (hash(x)=26739455) +4400 val loss 6.8527 +4400 val perplexity 946.4750 +4400 train 6.539908 (lr=1.1102e-04) (hash(x)=22873602) +4401 train 6.636081 (lr=1.1100e-04) (hash(x)=26748712) +4402 train 6.820879 (lr=1.1097e-04) (hash(x)=26306618) +4403 train 6.961433 (lr=1.1095e-04) (hash(x)=26898808) +4404 train 6.747739 (lr=1.1092e-04) (hash(x)=25067751) +4405 train 6.758910 (lr=1.1090e-04) (hash(x)=25397145) +4406 train 6.938241 (lr=1.1087e-04) (hash(x)=24796962) +4407 train 6.715644 (lr=1.1085e-04) (hash(x)=23222996) +4408 train 6.690985 (lr=1.1083e-04) (hash(x)=24820189) +4409 train 7.165001 (lr=1.1080e-04) (hash(x)=27669038) +4410 train 6.719083 (lr=1.1078e-04) (hash(x)=24283976) +4411 train 6.857028 (lr=1.1075e-04) (hash(x)=25018789) +4412 train 6.821234 (lr=1.1073e-04) (hash(x)=26247064) +4413 train 6.897636 (lr=1.1070e-04) (hash(x)=22942904) +4414 train 6.722508 (lr=1.1068e-04) (hash(x)=23918746) +4415 train 6.819942 (lr=1.1066e-04) (hash(x)=26489285) +4416 train 5.812871 (lr=1.1063e-04) (hash(x)=14942495) +4417 train 6.653198 (lr=1.1061e-04) (hash(x)=23908505) +4418 train 6.892986 (lr=1.1058e-04) (hash(x)=25854036) +4419 train 6.752235 (lr=1.1056e-04) (hash(x)=27522868) +4420 train 6.637966 (lr=1.1053e-04) (hash(x)=26549205) +4421 train 6.494039 (lr=1.1051e-04) (hash(x)=24565522) +4422 train 6.846768 (lr=1.1048e-04) (hash(x)=23919123) +4423 train 6.700152 (lr=1.1046e-04) (hash(x)=25185942) +4424 train 6.681415 (lr=1.1044e-04) (hash(x)=24818969) +4425 train 6.818797 (lr=1.1041e-04) (hash(x)=26750372) +4426 train 6.801338 (lr=1.1039e-04) (hash(x)=25621536) +4427 train 7.276358 (lr=1.1036e-04) (hash(x)=28037060) +4428 train 7.253221 (lr=1.1034e-04) (hash(x)=30829517) +4429 train 6.839067 (lr=1.1031e-04) (hash(x)=28728766) +4430 train 6.814000 (lr=1.1029e-04) (hash(x)=25936895) +4431 train 6.948958 (lr=1.1027e-04) (hash(x)=27476158) +4432 train 6.679091 (lr=1.1024e-04) (hash(x)=23297921) +4433 train 6.616779 (lr=1.1022e-04) (hash(x)=23201299) +4434 train 6.566354 (lr=1.1019e-04) (hash(x)=22681766) +4435 train 6.631386 (lr=1.1017e-04) (hash(x)=23217512) +4436 train 7.079426 (lr=1.1014e-04) (hash(x)=29322443) +4437 train 6.663914 (lr=1.1012e-04) (hash(x)=23502072) +4438 train 6.743325 (lr=1.1010e-04) (hash(x)=28873527) +4439 train 6.787039 (lr=1.1007e-04) (hash(x)=23653175) +4440 train 6.564794 (lr=1.1005e-04) (hash(x)=21635879) +4441 train 6.599442 (lr=1.1002e-04) (hash(x)=22201854) +4442 train 6.530988 (lr=1.1000e-04) (hash(x)=23101164) +4443 train 6.958904 (lr=1.0997e-04) (hash(x)=25475122) +4444 train 6.667703 (lr=1.0995e-04) (hash(x)=25124825) +4445 train 6.865986 (lr=1.0992e-04) (hash(x)=26883852) +4446 train 6.628404 (lr=1.0990e-04) (hash(x)=24731829) +4447 train 6.558084 (lr=1.0988e-04) (hash(x)=22405076) +4448 train 6.746816 (lr=1.0985e-04) (hash(x)=27633869) +4449 train 6.824681 (lr=1.0983e-04) (hash(x)=25162594) +4450 val loss 6.8576 +4450 val perplexity 951.0665 +4450 train 6.821115 (lr=1.0980e-04) (hash(x)=26438149) +4451 train 6.858237 (lr=1.0978e-04) (hash(x)=26748800) +4452 train 6.560364 (lr=1.0975e-04) (hash(x)=22971620) +4453 train 6.752801 (lr=1.0973e-04) (hash(x)=25886430) +4454 train 6.491395 (lr=1.0971e-04) (hash(x)=21084137) +4455 train 6.698833 (lr=1.0968e-04) (hash(x)=25673545) +4456 train 7.373737 (lr=1.0966e-04) (hash(x)=29389002) +4457 train 6.412174 (lr=1.0963e-04) (hash(x)=21676076) +4458 train 6.466153 (lr=1.0961e-04) (hash(x)=22616647) +4459 train 6.953214 (lr=1.0958e-04) (hash(x)=22771197) +4460 train 6.829374 (lr=1.0956e-04) (hash(x)=26393514) +4461 train 7.035613 (lr=1.0953e-04) (hash(x)=24996433) +4462 train 6.665694 (lr=1.0951e-04) (hash(x)=19594028) +4463 train 6.815343 (lr=1.0949e-04) (hash(x)=22675428) +4464 train 6.840880 (lr=1.0946e-04) (hash(x)=26566551) +4465 train 6.820470 (lr=1.0944e-04) (hash(x)=22469290) +4466 train 7.295476 (lr=1.0941e-04) (hash(x)=29821654) +4467 train 6.763467 (lr=1.0939e-04) (hash(x)=26305388) +4468 train 6.658956 (lr=1.0936e-04) (hash(x)=21998506) +4469 train 7.111360 (lr=1.0934e-04) (hash(x)=23953315) +4470 train 6.683774 (lr=1.0932e-04) (hash(x)=23985456) +4471 train 7.134689 (lr=1.0929e-04) (hash(x)=28168456) +4472 train 6.766160 (lr=1.0927e-04) (hash(x)=25126411) +4473 train 6.549648 (lr=1.0924e-04) (hash(x)=24619336) +4474 train 6.689400 (lr=1.0922e-04) (hash(x)=24467798) +4475 train 7.678867 (lr=1.0919e-04) (hash(x)=31673254) +4476 train 7.395103 (lr=1.0917e-04) (hash(x)=29929610) +4477 train 7.108229 (lr=1.0914e-04) (hash(x)=29412572) +4478 train 7.249128 (lr=1.0912e-04) (hash(x)=31910006) +4479 train 6.917618 (lr=1.0910e-04) (hash(x)=26072586) +4480 train 6.831331 (lr=1.0907e-04) (hash(x)=25782825) +4481 train 6.687007 (lr=1.0905e-04) (hash(x)=21131363) +4482 train 6.798760 (lr=1.0902e-04) (hash(x)=25071223) +4483 train 7.383536 (lr=1.0900e-04) (hash(x)=32249577) +4484 train 6.667591 (lr=1.0897e-04) (hash(x)=24752808) +4485 train 6.701117 (lr=1.0895e-04) (hash(x)=24970539) +4486 train 6.618896 (lr=1.0892e-04) (hash(x)=24191005) +4487 train 6.850942 (lr=1.0890e-04) (hash(x)=24974331) +4488 train 6.972054 (lr=1.0888e-04) (hash(x)=27043409) +4489 train 6.616115 (lr=1.0885e-04) (hash(x)=11320385) +4490 train 6.607973 (lr=1.0883e-04) (hash(x)=11919565) +4491 train 6.556039 (lr=1.0880e-04) (hash(x)=10404694) +4492 train 6.556934 (lr=1.0878e-04) (hash(x)=12393159) +4493 train 6.411604 (lr=1.0875e-04) (hash(x)=11843609) +4494 train 6.374088 (lr=1.0873e-04) (hash(x)=12632729) +4495 train 6.785667 (lr=1.0870e-04) (hash(x)=21951984) +4496 train 7.582158 (lr=1.0868e-04) (hash(x)=19411544) +4497 train 7.484384 (lr=1.0866e-04) (hash(x)=21000228) +4498 train 7.023090 (lr=1.0863e-04) (hash(x)=26018207) +4499 train 7.014317 (lr=1.0861e-04) (hash(x)=24659058) +4500 val loss 6.8866 +4500 val perplexity 979.0566 +4500 train 7.170261 (lr=1.0858e-04) (hash(x)=27919597) +4501 train 6.774933 (lr=1.0856e-04) (hash(x)=26232596) +4502 train 6.932002 (lr=1.0853e-04) (hash(x)=26248912) +4503 train 6.742361 (lr=1.0851e-04) (hash(x)=25403751) +4504 train 6.653321 (lr=1.0848e-04) (hash(x)=21096637) +4505 train 6.797240 (lr=1.0846e-04) (hash(x)=26560941) +4506 train 6.810861 (lr=1.0844e-04) (hash(x)=24942406) +4507 train 6.928360 (lr=1.0841e-04) (hash(x)=24405748) +4508 train 6.799391 (lr=1.0839e-04) (hash(x)=22975455) +4509 train 6.751592 (lr=1.0836e-04) (hash(x)=26358820) +4510 train 6.726832 (lr=1.0834e-04) (hash(x)=24211938) +4511 train 6.913689 (lr=1.0831e-04) (hash(x)=26396012) +4512 train 6.540916 (lr=1.0829e-04) (hash(x)=22534410) +4513 train 6.659586 (lr=1.0826e-04) (hash(x)=23855025) +4514 train 6.563371 (lr=1.0824e-04) (hash(x)=22722345) +4515 train 6.492651 (lr=1.0822e-04) (hash(x)=22779251) +4516 train 6.915483 (lr=1.0819e-04) (hash(x)=23973078) +4517 train 6.736141 (lr=1.0817e-04) (hash(x)=19886228) +4518 train 6.773309 (lr=1.0814e-04) (hash(x)=23849694) +4519 train 7.212554 (lr=1.0812e-04) (hash(x)=24827190) +4520 train 6.783329 (lr=1.0809e-04) (hash(x)=25111498) +4521 train 7.568985 (lr=1.0807e-04) (hash(x)=29752556) +4522 train 7.013879 (lr=1.0804e-04) (hash(x)=25606805) +4523 train 6.830718 (lr=1.0802e-04) (hash(x)=22209714) +4524 train 6.492610 (lr=1.0800e-04) (hash(x)=24991834) +4525 train 6.775069 (lr=1.0797e-04) (hash(x)=27808158) +4526 train 6.720567 (lr=1.0795e-04) (hash(x)=23041199) +4527 train 6.773820 (lr=1.0792e-04) (hash(x)=24847458) +4528 train 6.717274 (lr=1.0790e-04) (hash(x)=25091787) +4529 train 7.690418 (lr=1.0787e-04) (hash(x)=29745551) +4530 train 6.408120 (lr=1.0785e-04) (hash(x)=20447167) +4531 train 6.695793 (lr=1.0782e-04) (hash(x)=20720911) +4532 train 6.785028 (lr=1.0780e-04) (hash(x)=24803353) +4533 train 6.891068 (lr=1.0778e-04) (hash(x)=23780724) +4534 train 6.890140 (lr=1.0775e-04) (hash(x)=23423120) +4535 train 6.536229 (lr=1.0773e-04) (hash(x)=22159088) +4536 train 6.718841 (lr=1.0770e-04) (hash(x)=25820304) +4537 train 6.492555 (lr=1.0768e-04) (hash(x)=22813612) +4538 train 6.852617 (lr=1.0765e-04) (hash(x)=27827979) +4539 train 6.856029 (lr=1.0763e-04) (hash(x)=25737179) +4540 train 7.064414 (lr=1.0760e-04) (hash(x)=23401504) +4541 train 6.719790 (lr=1.0758e-04) (hash(x)=25071988) +4542 train 6.763723 (lr=1.0756e-04) (hash(x)=22844541) +4543 train 6.561891 (lr=1.0753e-04) (hash(x)=22140034) +4544 train 6.758461 (lr=1.0751e-04) (hash(x)=26522091) +4545 train 6.798600 (lr=1.0748e-04) (hash(x)=24099725) +4546 train 6.420185 (lr=1.0746e-04) (hash(x)=19127182) +4547 train 6.529798 (lr=1.0743e-04) (hash(x)=18992693) +4548 train 7.535482 (lr=1.0741e-04) (hash(x)=26723015) +4549 train 7.287289 (lr=1.0738e-04) (hash(x)=30389969) +4550 val loss 6.8436 +4550 val perplexity 937.8892 +4550 train 6.601673 (lr=1.0736e-04) (hash(x)=24065654) +4551 train 6.373163 (lr=1.0733e-04) (hash(x)=19044797) +4552 train 6.884641 (lr=1.0731e-04) (hash(x)=24919665) +4553 train 6.956775 (lr=1.0729e-04) (hash(x)=22780968) +4554 train 6.670299 (lr=1.0726e-04) (hash(x)=24549699) +4555 train 6.540570 (lr=1.0724e-04) (hash(x)=21374811) +4556 train 6.639923 (lr=1.0721e-04) (hash(x)=25225950) +4557 train 6.766254 (lr=1.0719e-04) (hash(x)=25691882) +4558 train 6.691986 (lr=1.0716e-04) (hash(x)=24685235) +4559 train 6.506688 (lr=1.0714e-04) (hash(x)=23932794) +4560 train 7.151065 (lr=1.0711e-04) (hash(x)=28152043) +4561 train 6.595692 (lr=1.0709e-04) (hash(x)=23417051) +4562 train 6.652985 (lr=1.0707e-04) (hash(x)=26250211) +4563 train 6.933074 (lr=1.0704e-04) (hash(x)=25428813) +4564 train 7.051471 (lr=1.0702e-04) (hash(x)=27477379) +4565 train 6.812379 (lr=1.0699e-04) (hash(x)=23015212) +4566 train 6.562259 (lr=1.0697e-04) (hash(x)=22837608) +4567 train 6.669378 (lr=1.0694e-04) (hash(x)=25256890) +4568 train 6.543359 (lr=1.0692e-04) (hash(x)=22742827) +4569 train 6.964053 (lr=1.0689e-04) (hash(x)=30167922) +4570 train 6.630865 (lr=1.0687e-04) (hash(x)=24540265) +4571 train 7.010461 (lr=1.0684e-04) (hash(x)=26752941) +4572 train 6.780099 (lr=1.0682e-04) (hash(x)=25094026) +4573 train 7.505234 (lr=1.0680e-04) (hash(x)=28508785) +4574 train 6.921729 (lr=1.0677e-04) (hash(x)=26501871) +4575 train 6.626780 (lr=1.0675e-04) (hash(x)=24161711) +4576 train 6.597162 (lr=1.0672e-04) (hash(x)=24313695) +4577 train 7.064887 (lr=1.0670e-04) (hash(x)=28248933) +4578 train 7.222296 (lr=1.0667e-04) (hash(x)=28445722) +4579 train 6.774419 (lr=1.0665e-04) (hash(x)=24589015) +4580 train 6.969073 (lr=1.0662e-04) (hash(x)=26192193) +4581 train 6.574613 (lr=1.0660e-04) (hash(x)=25131316) +4582 train 6.662455 (lr=1.0657e-04) (hash(x)=26631504) +4583 train 6.500681 (lr=1.0655e-04) (hash(x)=22036817) +4584 train 7.141458 (lr=1.0653e-04) (hash(x)=28361254) +4585 train 6.784888 (lr=1.0650e-04) (hash(x)=24828340) +4586 train 6.422285 (lr=1.0648e-04) (hash(x)=24067304) +4587 train 6.231550 (lr=1.0645e-04) (hash(x)=20733289) +4588 train 6.150353 (lr=1.0643e-04) (hash(x)=19526622) +4589 train 6.525940 (lr=1.0640e-04) (hash(x)=22148688) +4590 train 6.779009 (lr=1.0638e-04) (hash(x)=24141800) +4591 train 6.845410 (lr=1.0635e-04) (hash(x)=26663208) +4592 train 6.490400 (lr=1.0633e-04) (hash(x)=22536305) +4593 train 6.803476 (lr=1.0631e-04) (hash(x)=23608185) +4594 train 6.618015 (lr=1.0628e-04) (hash(x)=23348495) +4595 train 6.779398 (lr=1.0626e-04) (hash(x)=25409759) +4596 train 6.762429 (lr=1.0623e-04) (hash(x)=25572131) +4597 train 6.790740 (lr=1.0621e-04) (hash(x)=21782039) +4598 train 6.686376 (lr=1.0618e-04) (hash(x)=24643923) +4599 train 6.663164 (lr=1.0616e-04) (hash(x)=24072213) +4600 val loss 6.8566 +4600 val perplexity 950.1078 +4600 train 6.617399 (lr=1.0613e-04) (hash(x)=23925612) +4601 train 6.684378 (lr=1.0611e-04) (hash(x)=23315415) +4602 train 6.717186 (lr=1.0608e-04) (hash(x)=21793800) +4603 train 6.614044 (lr=1.0606e-04) (hash(x)=24921200) +4604 train 6.866420 (lr=1.0604e-04) (hash(x)=27226113) +4605 train 6.681446 (lr=1.0601e-04) (hash(x)=22920960) +4606 train 6.585495 (lr=1.0599e-04) (hash(x)=21947750) +4607 train 6.705594 (lr=1.0596e-04) (hash(x)=22766044) +4608 train 7.066425 (lr=1.0594e-04) (hash(x)=28237005) +4609 train 6.505200 (lr=1.0591e-04) (hash(x)=24922621) +4610 train 6.791173 (lr=1.0589e-04) (hash(x)=24899830) +4611 train 7.117586 (lr=1.0586e-04) (hash(x)=32920298) +4612 train 6.564771 (lr=1.0584e-04) (hash(x)=25083835) +4613 train 6.658756 (lr=1.0581e-04) (hash(x)=22863054) +4614 train 6.612369 (lr=1.0579e-04) (hash(x)=24841464) +4615 train 6.973583 (lr=1.0576e-04) (hash(x)=27871153) +4616 train 6.936882 (lr=1.0574e-04) (hash(x)=28025163) +4617 train 6.553988 (lr=1.0572e-04) (hash(x)=24659561) +4618 train 6.692768 (lr=1.0569e-04) (hash(x)=25067194) +4619 train 6.705860 (lr=1.0567e-04) (hash(x)=22731460) +4620 train 6.711382 (lr=1.0564e-04) (hash(x)=20445873) +4621 train 6.737525 (lr=1.0562e-04) (hash(x)=26033948) +4622 train 6.608256 (lr=1.0559e-04) (hash(x)=22473213) +4623 train 7.272658 (lr=1.0557e-04) (hash(x)=24037280) +4624 train 7.783902 (lr=1.0554e-04) (hash(x)=25624131) +4625 train 7.287795 (lr=1.0552e-04) (hash(x)=26799867) +4626 train 6.775449 (lr=1.0549e-04) (hash(x)=27187602) +4627 train 6.712476 (lr=1.0547e-04) (hash(x)=23277695) +4628 train 6.696064 (lr=1.0545e-04) (hash(x)=24748234) +4629 train 6.861444 (lr=1.0542e-04) (hash(x)=26103104) +4630 train 6.763756 (lr=1.0540e-04) (hash(x)=24327389) +4631 train 6.868932 (lr=1.0537e-04) (hash(x)=24121850) +4632 train 6.701993 (lr=1.0535e-04) (hash(x)=23714590) +4633 train 6.769855 (lr=1.0532e-04) (hash(x)=22379412) +4634 train 7.011658 (lr=1.0530e-04) (hash(x)=24454713) +4635 train 6.661302 (lr=1.0527e-04) (hash(x)=22966977) +4636 train 6.680625 (lr=1.0525e-04) (hash(x)=23764884) +4637 train 6.539600 (lr=1.0522e-04) (hash(x)=23827429) +4638 train 6.768747 (lr=1.0520e-04) (hash(x)=24088592) +4639 train 6.713620 (lr=1.0518e-04) (hash(x)=24380031) +4640 train 6.812093 (lr=1.0515e-04) (hash(x)=26065050) +4641 train 6.698345 (lr=1.0513e-04) (hash(x)=24442902) +4642 train 6.336202 (lr=1.0510e-04) (hash(x)=18548782) +4643 train 6.803016 (lr=1.0508e-04) (hash(x)=26957303) +4644 train 6.808969 (lr=1.0505e-04) (hash(x)=25032727) +4645 train 6.661395 (lr=1.0503e-04) (hash(x)=27224706) +4646 train 6.819057 (lr=1.0500e-04) (hash(x)=27508476) +4647 train 6.568614 (lr=1.0498e-04) (hash(x)=23055215) +4648 train 6.667826 (lr=1.0495e-04) (hash(x)=24496194) +4649 train 7.781665 (lr=1.0493e-04) (hash(x)=13982941) +4650 val loss 6.8458 +4650 val perplexity 939.9414 +4650 train 7.156137 (lr=1.0490e-04) (hash(x)=16721547) +4651 train 6.738876 (lr=1.0488e-04) (hash(x)=22929154) +4652 train 6.608243 (lr=1.0486e-04) (hash(x)=23323994) +4653 train 6.991921 (lr=1.0483e-04) (hash(x)=24877951) +4654 train 6.882239 (lr=1.0481e-04) (hash(x)=24096183) +4655 train 6.677348 (lr=1.0478e-04) (hash(x)=25329724) +4656 train 6.622552 (lr=1.0476e-04) (hash(x)=23877337) +4657 train 6.325511 (lr=1.0473e-04) (hash(x)=20923083) +4658 train 6.617769 (lr=1.0471e-04) (hash(x)=23807996) +4659 train 6.726782 (lr=1.0468e-04) (hash(x)=24370475) +4660 train 7.102216 (lr=1.0466e-04) (hash(x)=28202255) +4661 train 6.772810 (lr=1.0463e-04) (hash(x)=26142119) +4662 train 6.587736 (lr=1.0461e-04) (hash(x)=21387743) +4663 train 6.721777 (lr=1.0458e-04) (hash(x)=25662408) +4664 train 6.742555 (lr=1.0456e-04) (hash(x)=23962815) +4665 train 6.711985 (lr=1.0454e-04) (hash(x)=23987677) +4666 train 7.035161 (lr=1.0451e-04) (hash(x)=26554284) +4667 train 7.063850 (lr=1.0449e-04) (hash(x)=25991817) +4668 train 6.745886 (lr=1.0446e-04) (hash(x)=24256966) +4669 train 6.488042 (lr=1.0444e-04) (hash(x)=22187158) +4670 train 6.778424 (lr=1.0441e-04) (hash(x)=26295320) +4671 train 6.838223 (lr=1.0439e-04) (hash(x)=26346814) +4672 train 7.140420 (lr=1.0436e-04) (hash(x)=26594196) +4673 train 6.866277 (lr=1.0434e-04) (hash(x)=24322101) +4674 train 6.956043 (lr=1.0431e-04) (hash(x)=27274566) +4675 train 6.748751 (lr=1.0429e-04) (hash(x)=24505725) +4676 train 6.861784 (lr=1.0427e-04) (hash(x)=26167371) +4677 train 7.051567 (lr=1.0424e-04) (hash(x)=28062311) +4678 train 6.691937 (lr=1.0422e-04) (hash(x)=23476009) +4679 train 6.837733 (lr=1.0419e-04) (hash(x)=25283256) +4680 train 6.561932 (lr=1.0417e-04) (hash(x)=22033246) +4681 train 6.611320 (lr=1.0414e-04) (hash(x)=22716214) +4682 train 6.738142 (lr=1.0412e-04) (hash(x)=25672672) +4683 train 6.610075 (lr=1.0409e-04) (hash(x)=22979072) +4684 train 6.812343 (lr=1.0407e-04) (hash(x)=27439204) +4685 train 6.679767 (lr=1.0404e-04) (hash(x)=24857737) +4686 train 7.078681 (lr=1.0402e-04) (hash(x)=29615897) +4687 train 6.478140 (lr=1.0399e-04) (hash(x)=24021771) +4688 train 6.722273 (lr=1.0397e-04) (hash(x)=27410807) +4689 train 6.531349 (lr=1.0394e-04) (hash(x)=22850411) +4690 train 6.863567 (lr=1.0392e-04) (hash(x)=24949696) +4691 train 6.610474 (lr=1.0390e-04) (hash(x)=22956381) +4692 train 7.124044 (lr=1.0387e-04) (hash(x)=28193458) +4693 train 6.687074 (lr=1.0385e-04) (hash(x)=25596844) +4694 train 6.614580 (lr=1.0382e-04) (hash(x)=22101377) +4695 train 6.527902 (lr=1.0380e-04) (hash(x)=23576840) +4696 train 6.522301 (lr=1.0377e-04) (hash(x)=21849758) +4697 train 6.722600 (lr=1.0375e-04) (hash(x)=26431349) +4698 train 6.826772 (lr=1.0372e-04) (hash(x)=22960758) +4699 train 6.767840 (lr=1.0370e-04) (hash(x)=23243097) +4700 val loss 6.8379 +4700 val perplexity 932.5285 +4700 train 6.645391 (lr=1.0367e-04) (hash(x)=23715370) +4701 train 7.289497 (lr=1.0365e-04) (hash(x)=30678293) +4702 train 7.268864 (lr=1.0362e-04) (hash(x)=32481620) +4703 train 6.933671 (lr=1.0360e-04) (hash(x)=26414858) +4704 train 6.767171 (lr=1.0358e-04) (hash(x)=24768691) +4705 train 6.455888 (lr=1.0355e-04) (hash(x)=21627762) +4706 train 6.566767 (lr=1.0353e-04) (hash(x)=21024917) +4707 train 6.485158 (lr=1.0350e-04) (hash(x)=23570951) +4708 train 6.608132 (lr=1.0348e-04) (hash(x)=23729185) +4709 train 6.992542 (lr=1.0345e-04) (hash(x)=25933754) +4710 train 6.374849 (lr=1.0343e-04) (hash(x)=23091014) +4711 train 6.564669 (lr=1.0340e-04) (hash(x)=20099261) +4712 train 6.686293 (lr=1.0338e-04) (hash(x)=26807297) +4713 train 6.574502 (lr=1.0335e-04) (hash(x)=25332115) +4714 train 6.570032 (lr=1.0333e-04) (hash(x)=23247605) +4715 train 6.458462 (lr=1.0330e-04) (hash(x)=23786549) +4716 train 6.596419 (lr=1.0328e-04) (hash(x)=23981166) +4717 train 6.761294 (lr=1.0326e-04) (hash(x)=25967754) +4718 train 6.616960 (lr=1.0323e-04) (hash(x)=23659116) +4719 train 6.685711 (lr=1.0321e-04) (hash(x)=22453718) +4720 train 6.612755 (lr=1.0318e-04) (hash(x)=22597951) +4721 train 6.832849 (lr=1.0316e-04) (hash(x)=25284885) +4722 train 6.763364 (lr=1.0313e-04) (hash(x)=24748569) +4723 train 6.407938 (lr=1.0311e-04) (hash(x)=19448608) +4724 train 6.721561 (lr=1.0308e-04) (hash(x)=24888040) +4725 train 6.543894 (lr=1.0306e-04) (hash(x)=23203503) +4726 train 6.309494 (lr=1.0303e-04) (hash(x)=20387787) +4727 train 6.448917 (lr=1.0301e-04) (hash(x)=22529445) +4728 train 6.730635 (lr=1.0298e-04) (hash(x)=22455471) +4729 train 6.700087 (lr=1.0296e-04) (hash(x)=25661132) +4730 train 6.695432 (lr=1.0293e-04) (hash(x)=24997711) +4731 train 6.878798 (lr=1.0291e-04) (hash(x)=22575521) +4732 train 6.580721 (lr=1.0289e-04) (hash(x)=22640285) +4733 train 6.448650 (lr=1.0286e-04) (hash(x)=18637357) +4734 train 6.611969 (lr=1.0284e-04) (hash(x)=22845826) +4735 train 6.832355 (lr=1.0281e-04) (hash(x)=24484543) +4736 train 6.674081 (lr=1.0279e-04) (hash(x)=23352320) +4737 train 6.443909 (lr=1.0276e-04) (hash(x)=21544758) +4738 train 6.222775 (lr=1.0274e-04) (hash(x)=18292136) +4739 train 6.937458 (lr=1.0271e-04) (hash(x)=24893614) +4740 train 6.740598 (lr=1.0269e-04) (hash(x)=28103443) +4741 train 6.564887 (lr=1.0266e-04) (hash(x)=22233356) +4742 train 6.418771 (lr=1.0264e-04) (hash(x)=21133541) +4743 train 6.695026 (lr=1.0261e-04) (hash(x)=24043998) +4744 train 7.002538 (lr=1.0259e-04) (hash(x)=24801185) +4745 train 6.741107 (lr=1.0256e-04) (hash(x)=23858358) +4746 train 6.792718 (lr=1.0254e-04) (hash(x)=23926989) +4747 train 6.847858 (lr=1.0252e-04) (hash(x)=24813708) +4748 train 6.658395 (lr=1.0249e-04) (hash(x)=26339467) +4749 train 6.526909 (lr=1.0247e-04) (hash(x)=21850656) +4750 val loss 6.8332 +4750 val perplexity 928.1907 +4750 train 6.553168 (lr=1.0244e-04) (hash(x)=21475802) +4751 train 6.698186 (lr=1.0242e-04) (hash(x)=24301906) +4752 train 6.553594 (lr=1.0239e-04) (hash(x)=22748495) +4753 train 6.731884 (lr=1.0237e-04) (hash(x)=25649256) +4754 train 6.604394 (lr=1.0234e-04) (hash(x)=23934346) +4755 train 6.744371 (lr=1.0232e-04) (hash(x)=26332892) +4756 train 6.582848 (lr=1.0229e-04) (hash(x)=23279389) +4757 train 6.642505 (lr=1.0227e-04) (hash(x)=23146858) +4758 train 7.096859 (lr=1.0224e-04) (hash(x)=26892932) +4759 train 6.535709 (lr=1.0222e-04) (hash(x)=26328881) +4760 train 6.607625 (lr=1.0219e-04) (hash(x)=24394655) +4761 train 6.687614 (lr=1.0217e-04) (hash(x)=22122308) +4762 train 6.797274 (lr=1.0215e-04) (hash(x)=24200369) +4763 train 6.923988 (lr=1.0212e-04) (hash(x)=26841776) +4764 train 6.843721 (lr=1.0210e-04) (hash(x)=27196641) +4765 train 6.601759 (lr=1.0207e-04) (hash(x)=24912822) +4766 train 6.841160 (lr=1.0205e-04) (hash(x)=25946055) +4767 train 6.442070 (lr=1.0202e-04) (hash(x)=23101508) +4768 train 6.633420 (lr=1.0200e-04) (hash(x)=24287798) +4769 train 6.700449 (lr=1.0197e-04) (hash(x)=22798964) +4770 train 6.639043 (lr=1.0195e-04) (hash(x)=24164479) +4771 train 6.681278 (lr=1.0192e-04) (hash(x)=24946464) +4772 train 6.855106 (lr=1.0190e-04) (hash(x)=25154423) +4773 train 6.508721 (lr=1.0187e-04) (hash(x)=23173476) +4774 train 6.785816 (lr=1.0185e-04) (hash(x)=25373559) +4775 train 6.773729 (lr=1.0182e-04) (hash(x)=23527176) +4776 train 6.652081 (lr=1.0180e-04) (hash(x)=24865403) +4777 train 6.629979 (lr=1.0178e-04) (hash(x)=24451067) +4778 train 7.263655 (lr=1.0175e-04) (hash(x)=28187162) +4779 train 7.422599 (lr=1.0173e-04) (hash(x)=31163350) +4780 train 7.691823 (lr=1.0170e-04) (hash(x)=33563280) +4781 train 7.798041 (lr=1.0168e-04) (hash(x)=34939183) +4782 train 7.260335 (lr=1.0165e-04) (hash(x)=30263543) +4783 train 6.620449 (lr=1.0163e-04) (hash(x)=22705673) +4784 train 6.479745 (lr=1.0160e-04) (hash(x)=21415023) +4785 train 6.740118 (lr=1.0158e-04) (hash(x)=26079097) +4786 train 7.060513 (lr=1.0155e-04) (hash(x)=25503836) +4787 train 6.909864 (lr=1.0153e-04) (hash(x)=24705721) +4788 train 6.789121 (lr=1.0150e-04) (hash(x)=24384657) +4789 train 6.657348 (lr=1.0148e-04) (hash(x)=22550579) +4790 train 6.700687 (lr=1.0145e-04) (hash(x)=22452164) +4791 train 7.032010 (lr=1.0143e-04) (hash(x)=28664796) +4792 train 7.343388 (lr=1.0141e-04) (hash(x)=26139280) +4793 train 7.035703 (lr=1.0138e-04) (hash(x)=23862341) +4794 train 6.576211 (lr=1.0136e-04) (hash(x)=23784757) +4795 train 6.422811 (lr=1.0133e-04) (hash(x)=22659441) +4796 train 7.190503 (lr=1.0131e-04) (hash(x)=29744216) +4797 train 7.150381 (lr=1.0128e-04) (hash(x)=25822591) +4798 train 6.516498 (lr=1.0126e-04) (hash(x)=22370895) +4799 train 7.015632 (lr=1.0123e-04) (hash(x)=27102890) +4800 val loss 6.8382 +4800 val perplexity 932.8416 +4800 train 7.014906 (lr=1.0121e-04) (hash(x)=27014625) +4801 train 6.771005 (lr=1.0118e-04) (hash(x)=25755963) +4802 train 7.000852 (lr=1.0116e-04) (hash(x)=29675278) +4803 train 7.222031 (lr=1.0113e-04) (hash(x)=26660930) +4804 train 7.141225 (lr=1.0111e-04) (hash(x)=24557060) +4805 train 7.276901 (lr=1.0108e-04) (hash(x)=24622741) +4806 train 7.326272 (lr=1.0106e-04) (hash(x)=23952601) +4807 train 6.858451 (lr=1.0103e-04) (hash(x)=26787259) +4808 train 7.045209 (lr=1.0101e-04) (hash(x)=28919605) +4809 train 7.413354 (lr=1.0099e-04) (hash(x)=37061654) +4810 train 7.201610 (lr=1.0096e-04) (hash(x)=30379739) +4811 train 6.993192 (lr=1.0094e-04) (hash(x)=26097180) +4812 train 7.157968 (lr=1.0091e-04) (hash(x)=26327092) +4813 train 6.832402 (lr=1.0089e-04) (hash(x)=23258030) +4814 train 6.968782 (lr=1.0086e-04) (hash(x)=25582015) +4815 train 6.647031 (lr=1.0084e-04) (hash(x)=23396088) +4816 train 6.599604 (lr=1.0081e-04) (hash(x)=21904146) +4817 train 6.835788 (lr=1.0079e-04) (hash(x)=26281676) +4818 train 6.587488 (lr=1.0076e-04) (hash(x)=23140470) +4819 train 6.860962 (lr=1.0074e-04) (hash(x)=24611098) +4820 train 6.698832 (lr=1.0071e-04) (hash(x)=23832642) +4821 train 6.923076 (lr=1.0069e-04) (hash(x)=21439671) +4822 train 6.729234 (lr=1.0066e-04) (hash(x)=25128845) +4823 train 6.698273 (lr=1.0064e-04) (hash(x)=24911831) +4824 train 6.848621 (lr=1.0061e-04) (hash(x)=26051723) +4825 train 6.870625 (lr=1.0059e-04) (hash(x)=26479565) +4826 train 6.995992 (lr=1.0057e-04) (hash(x)=26228987) +4827 train 6.860706 (lr=1.0054e-04) (hash(x)=25131300) +4828 train 6.519578 (lr=1.0052e-04) (hash(x)=19921978) +4829 train 6.565630 (lr=1.0049e-04) (hash(x)=23173449) +4830 train 6.921703 (lr=1.0047e-04) (hash(x)=24791832) +4831 train 6.635696 (lr=1.0044e-04) (hash(x)=23453491) +4832 train 6.810227 (lr=1.0042e-04) (hash(x)=22564139) +4833 train 6.614479 (lr=1.0039e-04) (hash(x)=21659918) +4834 train 6.719414 (lr=1.0037e-04) (hash(x)=22956076) +4835 train 6.839929 (lr=1.0034e-04) (hash(x)=22237612) +4836 train 6.956979 (lr=1.0032e-04) (hash(x)=24736427) +4837 train 7.003910 (lr=1.0029e-04) (hash(x)=24939751) +4838 train 6.907630 (lr=1.0027e-04) (hash(x)=25059298) +4839 train 6.800163 (lr=1.0024e-04) (hash(x)=23453396) +4840 train 6.268997 (lr=1.0022e-04) (hash(x)=17919338) +4841 train 6.816481 (lr=1.0019e-04) (hash(x)=23428815) +4842 train 7.069445 (lr=1.0017e-04) (hash(x)=27042659) +4843 train 7.147547 (lr=1.0015e-04) (hash(x)=25161278) +4844 train 6.941835 (lr=1.0012e-04) (hash(x)=24113253) +4845 train 7.062898 (lr=1.0010e-04) (hash(x)=26139263) +4846 train 7.091086 (lr=1.0007e-04) (hash(x)=27787006) +4847 train 6.814208 (lr=1.0005e-04) (hash(x)=23869612) +4848 train 6.904207 (lr=1.0002e-04) (hash(x)=26092193) +4849 train 6.999090 (lr=9.9997e-05) (hash(x)=29351182) +4850 val loss 6.8101 +4850 val perplexity 906.9270 +4850 train 7.139253 (lr=9.9972e-05) (hash(x)=28773463) +4851 train 7.094354 (lr=9.9948e-05) (hash(x)=28207741) +4852 train 6.616544 (lr=9.9923e-05) (hash(x)=23280878) +4853 train 7.119644 (lr=9.9898e-05) (hash(x)=26742336) +4854 train 6.866681 (lr=9.9873e-05) (hash(x)=23543321) +4855 train 7.269741 (lr=9.9849e-05) (hash(x)=26581590) +4856 train 6.699693 (lr=9.9824e-05) (hash(x)=22728668) +4857 train 6.490190 (lr=9.9799e-05) (hash(x)=19854534) +4858 train 6.958186 (lr=9.9775e-05) (hash(x)=26612813) +4859 train 7.073520 (lr=9.9750e-05) (hash(x)=25827863) +4860 train 6.731296 (lr=9.9725e-05) (hash(x)=24574997) +4861 train 6.918628 (lr=9.9700e-05) (hash(x)=26187830) +4862 train 6.869282 (lr=9.9676e-05) (hash(x)=25105823) +4863 train 6.947574 (lr=9.9651e-05) (hash(x)=28056342) +4864 train 6.824577 (lr=9.9626e-05) (hash(x)=21885801) +4865 train 6.991627 (lr=9.9602e-05) (hash(x)=25659043) +4866 train 6.997921 (lr=9.9577e-05) (hash(x)=23852824) +4867 train 6.748840 (lr=9.9552e-05) (hash(x)=23965470) +4868 train 6.785684 (lr=9.9527e-05) (hash(x)=25035012) +4869 train 6.988646 (lr=9.9503e-05) (hash(x)=26639165) +4870 train 6.978170 (lr=9.9478e-05) (hash(x)=29205362) +4871 train 6.805588 (lr=9.9453e-05) (hash(x)=25900866) +4872 train 6.833088 (lr=9.9429e-05) (hash(x)=25636242) +4873 train 6.909275 (lr=9.9404e-05) (hash(x)=25430698) +4874 train 6.852694 (lr=9.9379e-05) (hash(x)=27629981) +4875 train 6.842128 (lr=9.9354e-05) (hash(x)=27682625) +4876 train 7.145935 (lr=9.9330e-05) (hash(x)=27549409) +4877 train 6.793025 (lr=9.9305e-05) (hash(x)=24661627) +4878 train 6.911772 (lr=9.9280e-05) (hash(x)=25196542) +4879 train 6.791998 (lr=9.9255e-05) (hash(x)=24549177) +4880 train 6.732149 (lr=9.9231e-05) (hash(x)=23740600) +4881 train 6.626244 (lr=9.9206e-05) (hash(x)=21460850) +4882 train 6.937071 (lr=9.9181e-05) (hash(x)=27101400) +4883 train 6.949811 (lr=9.9157e-05) (hash(x)=24193076) +4884 train 6.873064 (lr=9.9132e-05) (hash(x)=24582947) +4885 train 6.822083 (lr=9.9107e-05) (hash(x)=25133839) +4886 train 6.794108 (lr=9.9082e-05) (hash(x)=24759454) +4887 train 6.833715 (lr=9.9058e-05) (hash(x)=28239583) +4888 train 7.140664 (lr=9.9033e-05) (hash(x)=29594489) +4889 train 6.845714 (lr=9.9008e-05) (hash(x)=23833431) +4890 train 6.809753 (lr=9.8983e-05) (hash(x)=23139411) +4891 train 6.778566 (lr=9.8959e-05) (hash(x)=20885864) +4892 train 7.156106 (lr=9.8934e-05) (hash(x)=26217418) +4893 train 6.907770 (lr=9.8909e-05) (hash(x)=27321870) +4894 train 6.418430 (lr=9.8885e-05) (hash(x)=19912955) +4895 train 6.716272 (lr=9.8860e-05) (hash(x)=23223554) +4896 train 6.909854 (lr=9.8835e-05) (hash(x)=25667219) +4897 train 7.176727 (lr=9.8810e-05) (hash(x)=28007972) +4898 train 6.965570 (lr=9.8786e-05) (hash(x)=27748764) +4899 train 6.882524 (lr=9.8761e-05) (hash(x)=27425770) +4900 val loss 6.8049 +4900 val perplexity 902.2190 +4900 train 7.051987 (lr=9.8736e-05) (hash(x)=28394020) +4901 train 6.861229 (lr=9.8711e-05) (hash(x)=24080235) +4902 train 6.735783 (lr=9.8687e-05) (hash(x)=23309527) +4903 train 6.739461 (lr=9.8662e-05) (hash(x)=24793480) +4904 train 6.967689 (lr=9.8637e-05) (hash(x)=25344456) +4905 train 6.892622 (lr=9.8613e-05) (hash(x)=24590670) +4906 train 6.827186 (lr=9.8588e-05) (hash(x)=26937171) +4907 train 6.955471 (lr=9.8563e-05) (hash(x)=26949097) +4908 train 6.671553 (lr=9.8538e-05) (hash(x)=22443915) +4909 train 6.735691 (lr=9.8514e-05) (hash(x)=23814995) +4910 train 6.807331 (lr=9.8489e-05) (hash(x)=26135871) +4911 train 6.651020 (lr=9.8464e-05) (hash(x)=25415570) +4912 train 6.947881 (lr=9.8439e-05) (hash(x)=26756326) +4913 train 6.790450 (lr=9.8415e-05) (hash(x)=22920200) +4914 train 6.853197 (lr=9.8390e-05) (hash(x)=26710977) +4915 train 6.784116 (lr=9.8365e-05) (hash(x)=24985634) +4916 train 6.891040 (lr=9.8340e-05) (hash(x)=26004335) +4917 train 6.800818 (lr=9.8316e-05) (hash(x)=25637457) +4918 train 7.033272 (lr=9.8291e-05) (hash(x)=26645180) +4919 train 6.913893 (lr=9.8266e-05) (hash(x)=24425760) +4920 train 7.132333 (lr=9.8242e-05) (hash(x)=28223544) +4921 train 6.798764 (lr=9.8217e-05) (hash(x)=25538618) +4922 train 7.084340 (lr=9.8192e-05) (hash(x)=26984784) +4923 train 7.146976 (lr=9.8167e-05) (hash(x)=29154578) +4924 train 6.782646 (lr=9.8143e-05) (hash(x)=25308123) +4925 train 7.145017 (lr=9.8118e-05) (hash(x)=27939259) +4926 train 6.747296 (lr=9.8093e-05) (hash(x)=21984545) +4927 train 6.736080 (lr=9.8068e-05) (hash(x)=23707134) +4928 train 6.852135 (lr=9.8044e-05) (hash(x)=27201034) +4929 train 7.165152 (lr=9.8019e-05) (hash(x)=31623877) +4930 train 6.830841 (lr=9.7994e-05) (hash(x)=22162782) +4931 train 6.781831 (lr=9.7969e-05) (hash(x)=20049335) +4932 train 6.685591 (lr=9.7945e-05) (hash(x)=25594665) +4933 train 6.788752 (lr=9.7920e-05) (hash(x)=25265312) +4934 train 6.881922 (lr=9.7895e-05) (hash(x)=27094896) +4935 train 7.228536 (lr=9.7871e-05) (hash(x)=28321697) +4936 train 6.779289 (lr=9.7846e-05) (hash(x)=25006013) +4937 train 6.990648 (lr=9.7821e-05) (hash(x)=24596431) +4938 train 6.996357 (lr=9.7796e-05) (hash(x)=25150510) +4939 train 6.499701 (lr=9.7772e-05) (hash(x)=21497535) +4940 train 6.773103 (lr=9.7747e-05) (hash(x)=25094669) +4941 train 6.667109 (lr=9.7722e-05) (hash(x)=24024557) +4942 train 6.974693 (lr=9.7697e-05) (hash(x)=24370776) +4943 train 6.829064 (lr=9.7673e-05) (hash(x)=23434031) +4944 train 6.817200 (lr=9.7648e-05) (hash(x)=24383517) +4945 train 6.826978 (lr=9.7623e-05) (hash(x)=25858759) +4946 train 6.371229 (lr=9.7598e-05) (hash(x)=20409561) +4947 train 7.083531 (lr=9.7574e-05) (hash(x)=27469117) +4948 train 6.644352 (lr=9.7549e-05) (hash(x)=22086623) +4949 train 6.959882 (lr=9.7524e-05) (hash(x)=25759281) +4950 val loss 6.8094 +4950 val perplexity 906.3524 +4950 train 6.876153 (lr=9.7499e-05) (hash(x)=27130117) +4951 train 6.769779 (lr=9.7475e-05) (hash(x)=27003481) +4952 train 7.052941 (lr=9.7450e-05) (hash(x)=26725937) +4953 train 6.799442 (lr=9.7425e-05) (hash(x)=22691119) +4954 train 6.863097 (lr=9.7400e-05) (hash(x)=17272898) +4955 train 6.661474 (lr=9.7376e-05) (hash(x)=17850370) +4956 train 6.663415 (lr=9.7351e-05) (hash(x)=18729639) +4957 train 6.883087 (lr=9.7326e-05) (hash(x)=25327160) +4958 train 7.006086 (lr=9.7302e-05) (hash(x)=28709044) +4959 train 6.578156 (lr=9.7277e-05) (hash(x)=22236893) +4960 train 6.554546 (lr=9.7252e-05) (hash(x)=21729251) +4961 train 6.653811 (lr=9.7227e-05) (hash(x)=23852346) +4962 train 6.907745 (lr=9.7203e-05) (hash(x)=23974368) +4963 train 6.809888 (lr=9.7178e-05) (hash(x)=25764691) +4964 train 7.182287 (lr=9.7153e-05) (hash(x)=28341865) +4965 train 6.695339 (lr=9.7128e-05) (hash(x)=23856238) +4966 train 6.949515 (lr=9.7104e-05) (hash(x)=24568904) +4967 train 6.852286 (lr=9.7079e-05) (hash(x)=26857458) +4968 train 6.688712 (lr=9.7054e-05) (hash(x)=20507972) +4969 train 6.905873 (lr=9.7029e-05) (hash(x)=23139455) +4970 train 6.704041 (lr=9.7005e-05) (hash(x)=24853703) +4971 train 6.768646 (lr=9.6980e-05) (hash(x)=25654849) +4972 train 6.586267 (lr=9.6955e-05) (hash(x)=22963710) +4973 train 6.998671 (lr=9.6930e-05) (hash(x)=25652110) +4974 train 6.909349 (lr=9.6906e-05) (hash(x)=24085957) +4975 train 7.110539 (lr=9.6881e-05) (hash(x)=26413122) +4976 train 7.290235 (lr=9.6856e-05) (hash(x)=26989387) +4977 train 6.943774 (lr=9.6831e-05) (hash(x)=22784033) +4978 train 7.281620 (lr=9.6807e-05) (hash(x)=26694945) +4979 train 7.205448 (lr=9.6782e-05) (hash(x)=24507726) +4980 train 7.277875 (lr=9.6757e-05) (hash(x)=26490335) +4981 train 7.179653 (lr=9.6732e-05) (hash(x)=25624751) +4982 train 7.145508 (lr=9.6708e-05) (hash(x)=27846204) +4983 train 7.053813 (lr=9.6683e-05) (hash(x)=27696537) +4984 train 6.908569 (lr=9.6658e-05) (hash(x)=28915842) +4985 train 6.963002 (lr=9.6634e-05) (hash(x)=28274576) +4986 train 6.995515 (lr=9.6609e-05) (hash(x)=28923892) +4987 train 6.609841 (lr=9.6584e-05) (hash(x)=21602520) +4988 train 6.568758 (lr=9.6559e-05) (hash(x)=21061011) +4989 train 7.036209 (lr=9.6535e-05) (hash(x)=28060542) +4990 train 6.849380 (lr=9.6510e-05) (hash(x)=24838134) +4991 train 6.791252 (lr=9.6485e-05) (hash(x)=21950234) +4992 train 7.049852 (lr=9.6460e-05) (hash(x)=27192740) +4993 train 7.036859 (lr=9.6436e-05) (hash(x)=26770105) +4994 train 6.691747 (lr=9.6411e-05) (hash(x)=23721261) +4995 train 6.764431 (lr=9.6386e-05) (hash(x)=26064895) +4996 train 6.929451 (lr=9.6361e-05) (hash(x)=25651075) +4997 train 6.813091 (lr=9.6337e-05) (hash(x)=25029447) +4998 train 6.935493 (lr=9.6312e-05) (hash(x)=26088225) +4999 train 6.831342 (lr=9.6287e-05) (hash(x)=24051952) +5000 val loss 6.8060 +5000 val perplexity 903.2607 +5000 train 7.119318 (lr=9.6262e-05) (hash(x)=27671096) +5001 train 6.886547 (lr=9.6238e-05) (hash(x)=21510847) +5002 train 6.988344 (lr=9.6213e-05) (hash(x)=22444248) +5003 train 6.855206 (lr=9.6188e-05) (hash(x)=23898545) +5004 train 6.827136 (lr=9.6163e-05) (hash(x)=25372871) +5005 train 6.719972 (lr=9.6139e-05) (hash(x)=24179564) +5006 train 6.907381 (lr=9.6114e-05) (hash(x)=27157959) +5007 train 6.762409 (lr=9.6089e-05) (hash(x)=24029939) +5008 train 6.602869 (lr=9.6064e-05) (hash(x)=21326209) +5009 train 6.765321 (lr=9.6040e-05) (hash(x)=24678605) +5010 train 6.716585 (lr=9.6015e-05) (hash(x)=22456690) +5011 train 6.818122 (lr=9.5990e-05) (hash(x)=25044563) +5012 train 6.969776 (lr=9.5965e-05) (hash(x)=27476174) +5013 train 8.723328 (lr=9.5941e-05) (hash(x)=35911595) +5014 train 6.506436 (lr=9.5916e-05) (hash(x)=19380649) +5015 train 6.919833 (lr=9.5891e-05) (hash(x)=24393346) +5016 train 6.812145 (lr=9.5866e-05) (hash(x)=25367533) +5017 train 6.810600 (lr=9.5842e-05) (hash(x)=22744936) +5018 train 6.699428 (lr=9.5817e-05) (hash(x)=24091925) +5019 train 6.994817 (lr=9.5792e-05) (hash(x)=28452609) +5020 train 6.919025 (lr=9.5768e-05) (hash(x)=28083248) +5021 train 6.908870 (lr=9.5743e-05) (hash(x)=25512003) +5022 train 6.672005 (lr=9.5718e-05) (hash(x)=22956967) +5023 train 7.366930 (lr=9.5693e-05) (hash(x)=26985352) +5024 train 6.450666 (lr=9.5669e-05) (hash(x)=19762294) +5025 train 6.414966 (lr=9.5644e-05) (hash(x)=17526152) +5026 train 6.419557 (lr=9.5619e-05) (hash(x)=19782243) +5027 train 6.992571 (lr=9.5594e-05) (hash(x)=26394568) +5028 train 6.930541 (lr=9.5570e-05) (hash(x)=25592759) +5029 train 6.842696 (lr=9.5545e-05) (hash(x)=25318486) +5030 train 6.611304 (lr=9.5520e-05) (hash(x)=21592796) +5031 train 6.588808 (lr=9.5495e-05) (hash(x)=19493265) +5032 train 6.517513 (lr=9.5471e-05) (hash(x)=18573720) +5033 train 6.686963 (lr=9.5446e-05) (hash(x)=24507451) +5034 train 6.789182 (lr=9.5421e-05) (hash(x)=23415305) +5035 train 6.464078 (lr=9.5396e-05) (hash(x)=21230587) +5036 train 6.831174 (lr=9.5372e-05) (hash(x)=23927070) +5037 train 7.084607 (lr=9.5347e-05) (hash(x)=27738855) +5038 train 7.059085 (lr=9.5322e-05) (hash(x)=25935342) +5039 train 6.686523 (lr=9.5297e-05) (hash(x)=23944010) +5040 train 6.952915 (lr=9.5273e-05) (hash(x)=27102186) +5041 train 6.996863 (lr=9.5248e-05) (hash(x)=26372006) +5042 train 7.191411 (lr=9.5223e-05) (hash(x)=29135493) +5043 train 6.972921 (lr=9.5198e-05) (hash(x)=30456809) +5044 train 7.119377 (lr=9.5174e-05) (hash(x)=31511524) +5045 train 6.916039 (lr=9.5149e-05) (hash(x)=24781245) +5046 train 7.162239 (lr=9.5124e-05) (hash(x)=27848359) +5047 train 6.752933 (lr=9.5100e-05) (hash(x)=21517435) +5048 train 6.739620 (lr=9.5075e-05) (hash(x)=23204698) +5049 train 6.569971 (lr=9.5050e-05) (hash(x)=24233710) +5050 val loss 6.7967 +5050 val perplexity 894.8876 +5050 train 6.571050 (lr=9.5025e-05) (hash(x)=22269852) +5051 train 6.789043 (lr=9.5001e-05) (hash(x)=24353917) +5052 train 6.937453 (lr=9.4976e-05) (hash(x)=26830869) +5053 train 6.767808 (lr=9.4951e-05) (hash(x)=24562870) +5054 train 6.611825 (lr=9.4926e-05) (hash(x)=23293792) +5055 train 6.649066 (lr=9.4902e-05) (hash(x)=25025868) +5056 train 6.925275 (lr=9.4877e-05) (hash(x)=26983676) +5057 train 6.712763 (lr=9.4852e-05) (hash(x)=24219951) +5058 train 6.641163 (lr=9.4827e-05) (hash(x)=22461697) +5059 train 6.712533 (lr=9.4803e-05) (hash(x)=22273663) +5060 train 6.483372 (lr=9.4778e-05) (hash(x)=21710914) +5061 train 6.826713 (lr=9.4753e-05) (hash(x)=27580667) +5062 train 6.804513 (lr=9.4728e-05) (hash(x)=26181884) +5063 train 6.725801 (lr=9.4704e-05) (hash(x)=22940997) +5064 train 6.771484 (lr=9.4679e-05) (hash(x)=23741304) +5065 train 6.874730 (lr=9.4654e-05) (hash(x)=26593649) +5066 train 6.904389 (lr=9.4629e-05) (hash(x)=27697771) +5067 train 7.076743 (lr=9.4605e-05) (hash(x)=29402781) +5068 train 6.814147 (lr=9.4580e-05) (hash(x)=24335695) +5069 train 6.775932 (lr=9.4555e-05) (hash(x)=23894879) +5070 train 6.826995 (lr=9.4531e-05) (hash(x)=24044464) +5071 train 7.025670 (lr=9.4506e-05) (hash(x)=25864840) +5072 train 6.981965 (lr=9.4481e-05) (hash(x)=24734201) +5073 train 6.688365 (lr=9.4456e-05) (hash(x)=24089358) +5074 train 6.610784 (lr=9.4432e-05) (hash(x)=23928823) +5075 train 6.906410 (lr=9.4407e-05) (hash(x)=26245998) +5076 train 6.627605 (lr=9.4382e-05) (hash(x)=22602693) +5077 train 6.968843 (lr=9.4357e-05) (hash(x)=24817993) +5078 train 6.668797 (lr=9.4333e-05) (hash(x)=24235289) +5079 train 6.667229 (lr=9.4308e-05) (hash(x)=24682151) +5080 train 6.639012 (lr=9.4283e-05) (hash(x)=22672915) +5081 train 6.364633 (lr=9.4258e-05) (hash(x)=22148775) +5082 train 6.404241 (lr=9.4234e-05) (hash(x)=21856381) +5083 train 6.666573 (lr=9.4209e-05) (hash(x)=23622029) +5084 train 6.777490 (lr=9.4184e-05) (hash(x)=26379564) +5085 train 6.941069 (lr=9.4160e-05) (hash(x)=26226059) +5086 train 6.920178 (lr=9.4135e-05) (hash(x)=26964644) +5087 train 6.781779 (lr=9.4110e-05) (hash(x)=27055330) +5088 train 6.705605 (lr=9.4085e-05) (hash(x)=24752706) +5089 train 6.930500 (lr=9.4061e-05) (hash(x)=27209598) +5090 train 6.917538 (lr=9.4036e-05) (hash(x)=28373566) +5091 train 6.572446 (lr=9.4011e-05) (hash(x)=22125662) +5092 train 7.023319 (lr=9.3986e-05) (hash(x)=27599554) +5093 train 6.765624 (lr=9.3962e-05) (hash(x)=23334240) +5094 train 6.670415 (lr=9.3937e-05) (hash(x)=22102478) +5095 train 6.760048 (lr=9.3912e-05) (hash(x)=22705710) +5096 train 6.683530 (lr=9.3887e-05) (hash(x)=24064437) +5097 train 6.930141 (lr=9.3863e-05) (hash(x)=24423227) +5098 train 6.656194 (lr=9.3838e-05) (hash(x)=24308585) +5099 train 7.105059 (lr=9.3813e-05) (hash(x)=23426381) +5100 val loss 6.7870 +5100 val perplexity 886.2176 +5100 train 6.670707 (lr=9.3789e-05) (hash(x)=23577767) +5101 train 6.877226 (lr=9.3764e-05) (hash(x)=23820445) +5102 train 7.018078 (lr=9.3739e-05) (hash(x)=26666486) +5103 train 7.112721 (lr=9.3714e-05) (hash(x)=26775238) +5104 train 7.025454 (lr=9.3690e-05) (hash(x)=28104538) +5105 train 6.984714 (lr=9.3665e-05) (hash(x)=26105993) +5106 train 7.272233 (lr=9.3640e-05) (hash(x)=28874892) +5107 train 7.258424 (lr=9.3615e-05) (hash(x)=28659494) +5108 train 7.111467 (lr=9.3591e-05) (hash(x)=28230409) +5109 train 6.976137 (lr=9.3566e-05) (hash(x)=27792588) +5110 train 6.835701 (lr=9.3541e-05) (hash(x)=24125012) +5111 train 6.694009 (lr=9.3517e-05) (hash(x)=21734331) +5112 train 6.659355 (lr=9.3492e-05) (hash(x)=21329345) +5113 train 6.666503 (lr=9.3467e-05) (hash(x)=20836230) +5114 train 7.086617 (lr=9.3442e-05) (hash(x)=27859866) +5115 train 6.749791 (lr=9.3418e-05) (hash(x)=26149297) +5116 train 6.355406 (lr=9.3393e-05) (hash(x)=22035287) +5117 train 6.640651 (lr=9.3368e-05) (hash(x)=24034094) +5118 train 6.876366 (lr=9.3343e-05) (hash(x)=25511275) +5119 train 7.037430 (lr=9.3319e-05) (hash(x)=25693442) +5120 train 6.859082 (lr=9.3294e-05) (hash(x)=24238644) +5121 train 6.795742 (lr=9.3269e-05) (hash(x)=27009150) +5122 train 6.828026 (lr=9.3245e-05) (hash(x)=27562018) +5123 train 6.967759 (lr=9.3220e-05) (hash(x)=25256537) +5124 train 6.908041 (lr=9.3195e-05) (hash(x)=24732969) +5125 train 6.975822 (lr=9.3170e-05) (hash(x)=26564639) +5126 train 6.841775 (lr=9.3146e-05) (hash(x)=25859936) +5127 train 6.765171 (lr=9.3121e-05) (hash(x)=25290454) +5128 train 6.706631 (lr=9.3096e-05) (hash(x)=26057541) +5129 train 6.597983 (lr=9.3071e-05) (hash(x)=20763052) +5130 train 6.799704 (lr=9.3047e-05) (hash(x)=24632947) +5131 train 6.813286 (lr=9.3022e-05) (hash(x)=22481385) +5132 train 6.903383 (lr=9.2997e-05) (hash(x)=26230113) +5133 train 6.961888 (lr=9.2973e-05) (hash(x)=24594175) +5134 train 6.892981 (lr=9.2948e-05) (hash(x)=26733933) +5135 train 6.806056 (lr=9.2923e-05) (hash(x)=25699860) +5136 train 6.792394 (lr=9.2898e-05) (hash(x)=25004860) +5137 train 6.568287 (lr=9.2874e-05) (hash(x)=21538194) +5138 train 6.831172 (lr=9.2849e-05) (hash(x)=25351665) +5139 train 7.030617 (lr=9.2824e-05) (hash(x)=24776432) +5140 train 7.745044 (lr=9.2800e-05) (hash(x)=27840013) +5141 train 7.006040 (lr=9.2775e-05) (hash(x)=27952241) +5142 train 7.126163 (lr=9.2750e-05) (hash(x)=29410640) +5143 train 6.765762 (lr=9.2725e-05) (hash(x)=19919115) +5144 train 6.974079 (lr=9.2701e-05) (hash(x)=25359426) +5145 train 6.886366 (lr=9.2676e-05) (hash(x)=26105338) +5146 train 6.819669 (lr=9.2651e-05) (hash(x)=24663206) +5147 train 7.685731 (lr=9.2627e-05) (hash(x)=33107169) +5148 train 6.916393 (lr=9.2602e-05) (hash(x)=25852121) +5149 train 7.368291 (lr=9.2577e-05) (hash(x)=28823558) +5150 val loss 6.8014 +5150 val perplexity 899.1370 +5150 train 6.925564 (lr=9.2552e-05) (hash(x)=26700266) +5151 train 6.863870 (lr=9.2528e-05) (hash(x)=25586967) +5152 train 6.996399 (lr=9.2503e-05) (hash(x)=26131789) +5153 train 6.914090 (lr=9.2478e-05) (hash(x)=24609028) +5154 train 6.844238 (lr=9.2453e-05) (hash(x)=25216988) +5155 train 6.786966 (lr=9.2429e-05) (hash(x)=25317418) +5156 train 6.649637 (lr=9.2404e-05) (hash(x)=23414100) +5157 train 6.444585 (lr=9.2379e-05) (hash(x)=22025412) +5158 train 6.793529 (lr=9.2355e-05) (hash(x)=24183244) +5159 train 6.790815 (lr=9.2330e-05) (hash(x)=25373506) +5160 train 6.780567 (lr=9.2305e-05) (hash(x)=23993626) +5161 train 6.853326 (lr=9.2281e-05) (hash(x)=24226292) +5162 train 6.789690 (lr=9.2256e-05) (hash(x)=28088368) +5163 train 6.660208 (lr=9.2231e-05) (hash(x)=24099329) +5164 train 6.643028 (lr=9.2206e-05) (hash(x)=22480634) +5165 train 6.773037 (lr=9.2182e-05) (hash(x)=24350062) +5166 train 6.623109 (lr=9.2157e-05) (hash(x)=22961882) +5167 train 6.888074 (lr=9.2132e-05) (hash(x)=26496148) +5168 train 6.952138 (lr=9.2108e-05) (hash(x)=28077849) +5169 train 6.948448 (lr=9.2083e-05) (hash(x)=27625348) +5170 train 6.870418 (lr=9.2058e-05) (hash(x)=26350424) +5171 train 7.084143 (lr=9.2033e-05) (hash(x)=26240306) +5172 train 6.751785 (lr=9.2009e-05) (hash(x)=22800548) +5173 train 6.767860 (lr=9.1984e-05) (hash(x)=22788078) +5174 train 6.654176 (lr=9.1959e-05) (hash(x)=22949070) +5175 train 6.890009 (lr=9.1935e-05) (hash(x)=27395083) +5176 train 7.721588 (lr=9.1910e-05) (hash(x)=36982903) +5177 train 6.914083 (lr=9.1885e-05) (hash(x)=24962594) +5178 train 7.096671 (lr=9.1860e-05) (hash(x)=26616025) +5179 train 6.802034 (lr=9.1836e-05) (hash(x)=25664921) +5180 train 6.885965 (lr=9.1811e-05) (hash(x)=30103067) +5181 train 6.942366 (lr=9.1786e-05) (hash(x)=27454780) +5182 train 6.995533 (lr=9.1762e-05) (hash(x)=26627207) +5183 train 6.937097 (lr=9.1737e-05) (hash(x)=27389709) +5184 train 6.934589 (lr=9.1712e-05) (hash(x)=25948451) +5185 train 6.924047 (lr=9.1688e-05) (hash(x)=27094712) +5186 train 6.803464 (lr=9.1663e-05) (hash(x)=25337447) +5187 train 6.873714 (lr=9.1638e-05) (hash(x)=25036495) +5188 train 6.956592 (lr=9.1613e-05) (hash(x)=23873516) +5189 train 6.845379 (lr=9.1589e-05) (hash(x)=27088330) +5190 train 6.842264 (lr=9.1564e-05) (hash(x)=24889579) +5191 train 7.129599 (lr=9.1539e-05) (hash(x)=29172968) +5192 train 6.868534 (lr=9.1515e-05) (hash(x)=24900922) +5193 train 6.735051 (lr=9.1490e-05) (hash(x)=25995084) +5194 train 7.018564 (lr=9.1465e-05) (hash(x)=28675317) +5195 train 6.636992 (lr=9.1441e-05) (hash(x)=26559640) +5196 train 6.710588 (lr=9.1416e-05) (hash(x)=24086171) +5197 train 6.586383 (lr=9.1391e-05) (hash(x)=21968289) +5198 train 7.277806 (lr=9.1366e-05) (hash(x)=30188196) +5199 train 6.823056 (lr=9.1342e-05) (hash(x)=25464920) +5200 val loss 6.7961 +5200 val perplexity 894.3778 +5200 train 7.091028 (lr=9.1317e-05) (hash(x)=26173181) +5201 train 7.094686 (lr=9.1292e-05) (hash(x)=27680219) +5202 train 6.778279 (lr=9.1268e-05) (hash(x)=25603121) +5203 train 6.925769 (lr=9.1243e-05) (hash(x)=25661701) +5204 train 7.242128 (lr=9.1218e-05) (hash(x)=26013585) +5205 train 6.594687 (lr=9.1194e-05) (hash(x)=24366700) +5206 train 6.669263 (lr=9.1169e-05) (hash(x)=25257775) +5207 train 6.745074 (lr=9.1144e-05) (hash(x)=25992320) +5208 train 7.140686 (lr=9.1120e-05) (hash(x)=26900590) +5209 train 7.445110 (lr=9.1095e-05) (hash(x)=29637054) +5210 train 6.782819 (lr=9.1070e-05) (hash(x)=24549530) +5211 train 6.856773 (lr=9.1045e-05) (hash(x)=25002688) +5212 train 6.575888 (lr=9.1021e-05) (hash(x)=24044117) +5213 train 6.750980 (lr=9.0996e-05) (hash(x)=26328463) +5214 train 6.466695 (lr=9.0971e-05) (hash(x)=22227720) +5215 train 6.751888 (lr=9.0947e-05) (hash(x)=24949509) +5216 train 6.482439 (lr=9.0922e-05) (hash(x)=20803942) +5217 train 6.693425 (lr=9.0897e-05) (hash(x)=23896318) +5218 train 7.043648 (lr=9.0873e-05) (hash(x)=27505505) +5219 train 7.323495 (lr=9.0848e-05) (hash(x)=32106793) +5220 train 7.082771 (lr=9.0823e-05) (hash(x)=27655652) +5221 train 6.773857 (lr=9.0799e-05) (hash(x)=22286002) +5222 train 6.785920 (lr=9.0774e-05) (hash(x)=25436085) +5223 train 6.872938 (lr=9.0749e-05) (hash(x)=25615151) +5224 train 6.884454 (lr=9.0725e-05) (hash(x)=25164282) +5225 train 6.590109 (lr=9.0700e-05) (hash(x)=25318304) +5226 train 6.713510 (lr=9.0675e-05) (hash(x)=25698854) +5227 train 7.440392 (lr=9.0651e-05) (hash(x)=31092520) +5228 train 7.054185 (lr=9.0626e-05) (hash(x)=27876462) +5229 train 6.645040 (lr=9.0601e-05) (hash(x)=25512238) +5230 train 6.777814 (lr=9.0577e-05) (hash(x)=27337001) +5231 train 6.833975 (lr=9.0552e-05) (hash(x)=27923548) +5232 train 6.860507 (lr=9.0527e-05) (hash(x)=26126903) +5233 train 6.944772 (lr=9.0502e-05) (hash(x)=26987079) +5234 train 6.941941 (lr=9.0478e-05) (hash(x)=27736752) +5235 train 6.474109 (lr=9.0453e-05) (hash(x)=20502148) +5236 train 6.950452 (lr=9.0428e-05) (hash(x)=25730359) +5237 train 7.007370 (lr=9.0404e-05) (hash(x)=25897090) +5238 train 7.109368 (lr=9.0379e-05) (hash(x)=27737344) +5239 train 6.951034 (lr=9.0354e-05) (hash(x)=26387848) +5240 train 6.887100 (lr=9.0330e-05) (hash(x)=19576641) +5241 train 6.727705 (lr=9.0305e-05) (hash(x)=25667615) +5242 train 7.014295 (lr=9.0280e-05) (hash(x)=28862899) +5243 train 7.007419 (lr=9.0256e-05) (hash(x)=27095086) +5244 train 6.895475 (lr=9.0231e-05) (hash(x)=26809459) +5245 train 6.762910 (lr=9.0206e-05) (hash(x)=22578578) +5246 train 6.733840 (lr=9.0182e-05) (hash(x)=20405975) +5247 train 6.677120 (lr=9.0157e-05) (hash(x)=22863518) +5248 train 6.869998 (lr=9.0132e-05) (hash(x)=25589310) +5249 train 6.668940 (lr=9.0108e-05) (hash(x)=24032373) +5250 val loss 6.7864 +5250 val perplexity 885.6954 +5250 train 6.657390 (lr=9.0083e-05) (hash(x)=24307631) +5251 train 6.730733 (lr=9.0058e-05) (hash(x)=22344972) +5252 train 6.694860 (lr=9.0034e-05) (hash(x)=23462221) +5253 train 6.918074 (lr=9.0009e-05) (hash(x)=26864577) +5254 train 7.048474 (lr=8.9984e-05) (hash(x)=27670761) +5255 train 6.594772 (lr=8.9960e-05) (hash(x)=20869581) +5256 train 6.628403 (lr=8.9935e-05) (hash(x)=23040048) +5257 train 7.391052 (lr=8.9910e-05) (hash(x)=26912443) +5258 train 7.228195 (lr=8.9886e-05) (hash(x)=27521477) +5259 train 7.401396 (lr=8.9861e-05) (hash(x)=30598301) +5260 train 7.201622 (lr=8.9836e-05) (hash(x)=27553532) +5261 train 6.847891 (lr=8.9812e-05) (hash(x)=24589527) +5262 train 6.783563 (lr=8.9787e-05) (hash(x)=24600906) +5263 train 6.363390 (lr=8.9762e-05) (hash(x)=18133606) +5264 train 6.756435 (lr=8.9738e-05) (hash(x)=24404101) +5265 train 6.866073 (lr=8.9713e-05) (hash(x)=25090392) +5266 train 6.692220 (lr=8.9688e-05) (hash(x)=23414438) +5267 train 6.849403 (lr=8.9664e-05) (hash(x)=25235010) +5268 train 6.839813 (lr=8.9639e-05) (hash(x)=26030672) +5269 train 6.514786 (lr=8.9615e-05) (hash(x)=24935365) +5270 train 6.900964 (lr=8.9590e-05) (hash(x)=25881960) +5271 train 6.940488 (lr=8.9565e-05) (hash(x)=28736122) +5272 train 6.745648 (lr=8.9541e-05) (hash(x)=24140149) +5273 train 6.306073 (lr=8.9516e-05) (hash(x)=18582531) +5274 train 6.756784 (lr=8.9491e-05) (hash(x)=24857973) +5275 train 7.069672 (lr=8.9467e-05) (hash(x)=31964687) +5276 train 6.766031 (lr=8.9442e-05) (hash(x)=23492762) +5277 train 7.055895 (lr=8.9417e-05) (hash(x)=26235680) +5278 train 6.818188 (lr=8.9393e-05) (hash(x)=23865809) +5279 train 6.769574 (lr=8.9368e-05) (hash(x)=25528329) +5280 train 6.825878 (lr=8.9343e-05) (hash(x)=23080663) +5281 train 6.746442 (lr=8.9319e-05) (hash(x)=24965563) +5282 train 7.019647 (lr=8.9294e-05) (hash(x)=28088400) +5283 train 7.086666 (lr=8.9269e-05) (hash(x)=25714091) +5284 train 7.143453 (lr=8.9245e-05) (hash(x)=30297970) +5285 train 6.943405 (lr=8.9220e-05) (hash(x)=27707039) +5286 train 6.557206 (lr=8.9195e-05) (hash(x)=21970067) +5287 train 6.690117 (lr=8.9171e-05) (hash(x)=24020765) +5288 train 6.721960 (lr=8.9146e-05) (hash(x)=24234154) +5289 train 6.926292 (lr=8.9122e-05) (hash(x)=26015275) +5290 train 6.966074 (lr=8.9097e-05) (hash(x)=27295071) +5291 train 6.780380 (lr=8.9072e-05) (hash(x)=25992253) +5292 train 7.022045 (lr=8.9048e-05) (hash(x)=28569126) +5293 train 6.874856 (lr=8.9023e-05) (hash(x)=25844953) +5294 train 6.964760 (lr=8.8998e-05) (hash(x)=25193813) +5295 train 7.180355 (lr=8.8974e-05) (hash(x)=27792245) +5296 train 7.173135 (lr=8.8949e-05) (hash(x)=26115965) +5297 train 6.713497 (lr=8.8924e-05) (hash(x)=24061711) +5298 train 6.984919 (lr=8.8900e-05) (hash(x)=28841643) +5299 train 7.028745 (lr=8.8875e-05) (hash(x)=26073593) +5300 val loss 6.7825 +5300 val perplexity 882.2281 +5300 train 6.962758 (lr=8.8851e-05) (hash(x)=27101667) +5301 train 6.985931 (lr=8.8826e-05) (hash(x)=29291251) +5302 train 6.884358 (lr=8.8801e-05) (hash(x)=26954695) +5303 train 6.726399 (lr=8.8777e-05) (hash(x)=28287635) +5304 train 6.831024 (lr=8.8752e-05) (hash(x)=27673805) +5305 train 6.546120 (lr=8.8727e-05) (hash(x)=22377141) +5306 train 6.539178 (lr=8.8703e-05) (hash(x)=21381559) +5307 train 6.992900 (lr=8.8678e-05) (hash(x)=26552691) +5308 train 6.771266 (lr=8.8654e-05) (hash(x)=21345465) +5309 train 6.703556 (lr=8.8629e-05) (hash(x)=21087948) +5310 train 6.588066 (lr=8.8604e-05) (hash(x)=22385470) +5311 train 6.520029 (lr=8.8580e-05) (hash(x)=20951206) +5312 train 7.044321 (lr=8.8555e-05) (hash(x)=26875026) +5313 train 6.962409 (lr=8.8530e-05) (hash(x)=25424360) +5314 train 6.740160 (lr=8.8506e-05) (hash(x)=23683387) +5315 train 6.766778 (lr=8.8481e-05) (hash(x)=24242534) +5316 train 6.878269 (lr=8.8457e-05) (hash(x)=23924087) +5317 train 6.687909 (lr=8.8432e-05) (hash(x)=23296703) +5318 train 6.253419 (lr=8.8407e-05) (hash(x)=14889111) +5319 train 6.503117 (lr=8.8383e-05) (hash(x)=22356452) +5320 train 6.905386 (lr=8.8358e-05) (hash(x)=27301986) +5321 train 6.639143 (lr=8.8333e-05) (hash(x)=24132282) +5322 train 6.765798 (lr=8.8309e-05) (hash(x)=27524086) +5323 train 6.847528 (lr=8.8284e-05) (hash(x)=26498154) +5324 train 6.488214 (lr=8.8260e-05) (hash(x)=23591099) +5325 train 6.918313 (lr=8.8235e-05) (hash(x)=25971622) +5326 train 6.940120 (lr=8.8210e-05) (hash(x)=26259885) +5327 train 6.779408 (lr=8.8186e-05) (hash(x)=24385170) +5328 train 6.751846 (lr=8.8161e-05) (hash(x)=25379964) +5329 train 6.982330 (lr=8.8137e-05) (hash(x)=28607035) +5330 train 6.583507 (lr=8.8112e-05) (hash(x)=22361074) +5331 train 7.229787 (lr=8.8087e-05) (hash(x)=28364745) +5332 train 6.994779 (lr=8.8063e-05) (hash(x)=28078835) +5333 train 6.835958 (lr=8.8038e-05) (hash(x)=28992889) +5334 train 6.723085 (lr=8.8013e-05) (hash(x)=24586705) +5335 train 6.826920 (lr=8.7989e-05) (hash(x)=23455854) +5336 train 6.859783 (lr=8.7964e-05) (hash(x)=26782164) +5337 train 6.847062 (lr=8.7940e-05) (hash(x)=24714995) +5338 train 6.809724 (lr=8.7915e-05) (hash(x)=26578056) +5339 train 6.923603 (lr=8.7890e-05) (hash(x)=26454794) +5340 train 6.924381 (lr=8.7866e-05) (hash(x)=25615977) +5341 train 6.525587 (lr=8.7841e-05) (hash(x)=23191758) +5342 train 7.134377 (lr=8.7817e-05) (hash(x)=30196630) +5343 train 6.610983 (lr=8.7792e-05) (hash(x)=21589405) +5344 train 6.706453 (lr=8.7767e-05) (hash(x)=25866595) +5345 train 6.991240 (lr=8.7743e-05) (hash(x)=26344506) +5346 train 6.902629 (lr=8.7718e-05) (hash(x)=24305075) +5347 train 6.793927 (lr=8.7694e-05) (hash(x)=25445166) +5348 train 6.912477 (lr=8.7669e-05) (hash(x)=27214999) +5349 train 6.818635 (lr=8.7644e-05) (hash(x)=26743203) +5350 val loss 6.7738 +5350 val perplexity 874.6603 +5350 train 7.050711 (lr=8.7620e-05) (hash(x)=28483107) +5351 train 6.686041 (lr=8.7595e-05) (hash(x)=24698150) +5352 train 6.845192 (lr=8.7571e-05) (hash(x)=25560667) +5353 train 6.650436 (lr=8.7546e-05) (hash(x)=25678105) +5354 train 6.823796 (lr=8.7521e-05) (hash(x)=24405638) +5355 train 6.606084 (lr=8.7497e-05) (hash(x)=21795788) +5356 train 6.694545 (lr=8.7472e-05) (hash(x)=19518892) +5357 train 6.787006 (lr=8.7448e-05) (hash(x)=22670004) +5358 train 7.262349 (lr=8.7423e-05) (hash(x)=32593024) +5359 train 6.881940 (lr=8.7399e-05) (hash(x)=28010836) +5360 train 7.063333 (lr=8.7374e-05) (hash(x)=30061197) +5361 train 6.967412 (lr=8.7349e-05) (hash(x)=27401111) +5362 train 6.850109 (lr=8.7325e-05) (hash(x)=25830560) +5363 train 6.994815 (lr=8.7300e-05) (hash(x)=26255418) +5364 train 7.079182 (lr=8.7276e-05) (hash(x)=27890883) +5365 train 6.879920 (lr=8.7251e-05) (hash(x)=27086915) +5366 train 6.898582 (lr=8.7226e-05) (hash(x)=24456440) +5367 train 6.950758 (lr=8.7202e-05) (hash(x)=25427381) +5368 train 6.708330 (lr=8.7177e-05) (hash(x)=25282670) +5369 train 6.684088 (lr=8.7153e-05) (hash(x)=20350564) +5370 train 6.558380 (lr=8.7128e-05) (hash(x)=21533244) +5371 train 6.802431 (lr=8.7104e-05) (hash(x)=25804914) +5372 train 6.833347 (lr=8.7079e-05) (hash(x)=25707639) +5373 train 7.027599 (lr=8.7054e-05) (hash(x)=27781879) +5374 train 7.269895 (lr=8.7030e-05) (hash(x)=29819925) +5375 train 7.315853 (lr=8.7005e-05) (hash(x)=27478557) +5376 train 7.150224 (lr=8.6981e-05) (hash(x)=28960748) +5377 train 6.580602 (lr=8.6956e-05) (hash(x)=22915560) +5378 train 6.628503 (lr=8.6932e-05) (hash(x)=23713290) +5379 train 6.980484 (lr=8.6907e-05) (hash(x)=28532986) +5380 train 6.949100 (lr=8.6882e-05) (hash(x)=27944777) +5381 train 6.926096 (lr=8.6858e-05) (hash(x)=26294839) +5382 train 6.562130 (lr=8.6833e-05) (hash(x)=23539631) +5383 train 6.760273 (lr=8.6809e-05) (hash(x)=23865569) +5384 train 6.869421 (lr=8.6784e-05) (hash(x)=25083729) +5385 train 6.761826 (lr=8.6760e-05) (hash(x)=24164657) +5386 train 6.896432 (lr=8.6735e-05) (hash(x)=24585690) +5387 train 6.754175 (lr=8.6711e-05) (hash(x)=23365484) +5388 train 6.991724 (lr=8.6686e-05) (hash(x)=26164114) +5389 train 6.921889 (lr=8.6661e-05) (hash(x)=28053451) +5390 train 7.748703 (lr=8.6637e-05) (hash(x)=31709088) +5391 train 6.819231 (lr=8.6612e-05) (hash(x)=23407132) +5392 train 6.925874 (lr=8.6588e-05) (hash(x)=26250086) +5393 train 6.782281 (lr=8.6563e-05) (hash(x)=26820895) +5394 train 6.608325 (lr=8.6539e-05) (hash(x)=23608821) +5395 train 7.169326 (lr=8.6514e-05) (hash(x)=26750510) +5396 train 6.621819 (lr=8.6489e-05) (hash(x)=23447808) +5397 train 6.928493 (lr=8.6465e-05) (hash(x)=24131963) +5398 train 6.652528 (lr=8.6440e-05) (hash(x)=24664943) +5399 train 6.596779 (lr=8.6416e-05) (hash(x)=20253664) +5400 val loss 6.7734 +5400 val perplexity 874.2747 +5400 train 6.913070 (lr=8.6391e-05) (hash(x)=23073932) +5401 train 7.120445 (lr=8.6367e-05) (hash(x)=31820468) +5402 train 6.671948 (lr=8.6342e-05) (hash(x)=24535932) +5403 train 6.769316 (lr=8.6318e-05) (hash(x)=24619408) +5404 train 6.649123 (lr=8.6293e-05) (hash(x)=21821155) +5405 train 6.811619 (lr=8.6269e-05) (hash(x)=24784107) +5406 train 6.649743 (lr=8.6244e-05) (hash(x)=20435871) +5407 train 6.541944 (lr=8.6219e-05) (hash(x)=21087928) +5408 train 6.776865 (lr=8.6195e-05) (hash(x)=25016195) +5409 train 6.846417 (lr=8.6170e-05) (hash(x)=25341703) +5410 train 6.872092 (lr=8.6146e-05) (hash(x)=25760577) +5411 train 7.010189 (lr=8.6121e-05) (hash(x)=28800595) +5412 train 6.853093 (lr=8.6097e-05) (hash(x)=26160439) +5413 train 6.856941 (lr=8.6072e-05) (hash(x)=25317118) +5414 train 6.593349 (lr=8.6048e-05) (hash(x)=23767638) +5415 train 6.758499 (lr=8.6023e-05) (hash(x)=25957589) +5416 train 6.632646 (lr=8.5999e-05) (hash(x)=24299810) +5417 train 6.955605 (lr=8.5974e-05) (hash(x)=25584592) +5418 train 6.747116 (lr=8.5950e-05) (hash(x)=23758384) +5419 train 6.812590 (lr=8.5925e-05) (hash(x)=24519649) +5420 train 6.623777 (lr=8.5901e-05) (hash(x)=23703662) +5421 train 6.805132 (lr=8.5876e-05) (hash(x)=24159131) +5422 train 6.823782 (lr=8.5851e-05) (hash(x)=24580461) +5423 train 6.965379 (lr=8.5827e-05) (hash(x)=27008610) +5424 train 6.774188 (lr=8.5802e-05) (hash(x)=28643720) +5425 train 6.829540 (lr=8.5778e-05) (hash(x)=25966593) +5426 train 6.792015 (lr=8.5753e-05) (hash(x)=23300756) +5427 train 7.133870 (lr=8.5729e-05) (hash(x)=25803040) +5428 train 6.874805 (lr=8.5704e-05) (hash(x)=25444529) +5429 train 6.949461 (lr=8.5680e-05) (hash(x)=26495218) +5430 train 6.602909 (lr=8.5655e-05) (hash(x)=22956308) +5431 train 6.954340 (lr=8.5631e-05) (hash(x)=27580265) +5432 train 6.886774 (lr=8.5606e-05) (hash(x)=26548439) +5433 train 7.043679 (lr=8.5582e-05) (hash(x)=30677288) +5434 train 7.001323 (lr=8.5557e-05) (hash(x)=32631553) +5435 train 6.929595 (lr=8.5533e-05) (hash(x)=29873037) +5436 train 7.101181 (lr=8.5508e-05) (hash(x)=28622601) +5437 train 6.809501 (lr=8.5484e-05) (hash(x)=26547966) +5438 train 6.817381 (lr=8.5459e-05) (hash(x)=23121402) +5439 train 6.677069 (lr=8.5435e-05) (hash(x)=24244798) +5440 train 6.891025 (lr=8.5410e-05) (hash(x)=26350421) +5441 train 6.821273 (lr=8.5386e-05) (hash(x)=25125564) +5442 train 6.758688 (lr=8.5361e-05) (hash(x)=24887111) +5443 train 6.737179 (lr=8.5337e-05) (hash(x)=22449713) +5444 train 6.609848 (lr=8.5312e-05) (hash(x)=21000641) +5445 train 6.723650 (lr=8.5288e-05) (hash(x)=24406712) +5446 train 6.753822 (lr=8.5263e-05) (hash(x)=25870897) +5447 train 6.670581 (lr=8.5239e-05) (hash(x)=24535871) +5448 train 6.956459 (lr=8.5214e-05) (hash(x)=30598963) +5449 train 6.954918 (lr=8.5190e-05) (hash(x)=26963614) +5450 val loss 6.7729 +5450 val perplexity 873.8712 +5450 train 6.936888 (lr=8.5165e-05) (hash(x)=27683120) +5451 train 7.258449 (lr=8.5141e-05) (hash(x)=30278191) +5452 train 6.729442 (lr=8.5116e-05) (hash(x)=22555106) +5453 train 6.781676 (lr=8.5092e-05) (hash(x)=25679475) +5454 train 6.777605 (lr=8.5067e-05) (hash(x)=25463327) +5455 train 6.820654 (lr=8.5043e-05) (hash(x)=27558681) +5456 train 6.780496 (lr=8.5018e-05) (hash(x)=27210802) +5457 train 6.746762 (lr=8.4994e-05) (hash(x)=25956094) +5458 train 6.889762 (lr=8.4969e-05) (hash(x)=25155920) +5459 train 6.757285 (lr=8.4945e-05) (hash(x)=25299486) +5460 train 6.863598 (lr=8.4920e-05) (hash(x)=24173588) +5461 train 6.846138 (lr=8.4896e-05) (hash(x)=23223432) +5462 train 6.698801 (lr=8.4871e-05) (hash(x)=22789811) +5463 train 6.531262 (lr=8.4847e-05) (hash(x)=21152793) +5464 train 6.701885 (lr=8.4822e-05) (hash(x)=24524146) +5465 train 6.756531 (lr=8.4798e-05) (hash(x)=26668399) +5466 train 6.852878 (lr=8.4773e-05) (hash(x)=26990178) +5467 train 6.694564 (lr=8.4749e-05) (hash(x)=24197830) +5468 train 6.414488 (lr=8.4724e-05) (hash(x)=21110315) +5469 train 6.908227 (lr=8.4700e-05) (hash(x)=21372114) +5470 train 6.561028 (lr=8.4675e-05) (hash(x)=22360232) +5471 train 6.957489 (lr=8.4651e-05) (hash(x)=28147005) +5472 train 6.784115 (lr=8.4627e-05) (hash(x)=25497907) +5473 train 6.825136 (lr=8.4602e-05) (hash(x)=26091722) +5474 train 7.020852 (lr=8.4578e-05) (hash(x)=26640380) +5475 train 6.918208 (lr=8.4553e-05) (hash(x)=27700158) +5476 train 6.860077 (lr=8.4529e-05) (hash(x)=26659383) +5477 train 6.667418 (lr=8.4504e-05) (hash(x)=23150914) +5478 train 6.920007 (lr=8.4480e-05) (hash(x)=28451771) +5479 train 6.625583 (lr=8.4455e-05) (hash(x)=21933180) +5480 train 6.438756 (lr=8.4431e-05) (hash(x)=18336782) +5481 train 6.823419 (lr=8.4406e-05) (hash(x)=28593884) +5482 train 6.976275 (lr=8.4382e-05) (hash(x)=25995737) +5483 train 6.631153 (lr=8.4357e-05) (hash(x)=23470482) +5484 train 6.740941 (lr=8.4333e-05) (hash(x)=24399247) +5485 train 6.962289 (lr=8.4308e-05) (hash(x)=22692875) +5486 train 7.051528 (lr=8.4284e-05) (hash(x)=27782972) +5487 train 6.775329 (lr=8.4260e-05) (hash(x)=24735895) +5488 train 6.937636 (lr=8.4235e-05) (hash(x)=26739032) +5489 train 7.150472 (lr=8.4211e-05) (hash(x)=26435203) +5490 train 6.921820 (lr=8.4186e-05) (hash(x)=27319682) +5491 train 6.475949 (lr=8.4162e-05) (hash(x)=22148167) +5492 train 6.844106 (lr=8.4137e-05) (hash(x)=25606445) +5493 train 6.677125 (lr=8.4113e-05) (hash(x)=23537482) +5494 train 6.945585 (lr=8.4088e-05) (hash(x)=26051751) +5495 train 6.674848 (lr=8.4064e-05) (hash(x)=26209948) +5496 train 7.228758 (lr=8.4040e-05) (hash(x)=28188903) +5497 train 7.121947 (lr=8.4015e-05) (hash(x)=27804754) +5498 train 6.921432 (lr=8.3991e-05) (hash(x)=27285270) +5499 train 6.674993 (lr=8.3966e-05) (hash(x)=25646265) +5500 val loss 6.7539 +5500 val perplexity 857.3859 +5500 train 6.813207 (lr=8.3942e-05) (hash(x)=27369782) +5501 train 6.577168 (lr=8.3917e-05) (hash(x)=22778204) +5502 train 6.442817 (lr=8.3893e-05) (hash(x)=21487353) +5503 train 6.747423 (lr=8.3868e-05) (hash(x)=23358313) +5504 train 6.841214 (lr=8.3844e-05) (hash(x)=26058393) +5505 train 6.943654 (lr=8.3820e-05) (hash(x)=25138681) +5506 train 7.036608 (lr=8.3795e-05) (hash(x)=29359396) +5507 train 6.657126 (lr=8.3771e-05) (hash(x)=25220289) +5508 train 6.791375 (lr=8.3746e-05) (hash(x)=27460334) +5509 train 6.736676 (lr=8.3722e-05) (hash(x)=25250267) +5510 train 6.536762 (lr=8.3697e-05) (hash(x)=23581210) +5511 train 6.518842 (lr=8.3673e-05) (hash(x)=22398001) +5512 train 6.586008 (lr=8.3649e-05) (hash(x)=21260507) +5513 train 6.552258 (lr=8.3624e-05) (hash(x)=22961844) +5514 train 6.442944 (lr=8.3600e-05) (hash(x)=22275986) +5515 train 6.562608 (lr=8.3575e-05) (hash(x)=23695664) +5516 train 6.731561 (lr=8.3551e-05) (hash(x)=24483770) +5517 train 6.832926 (lr=8.3527e-05) (hash(x)=25646845) +5518 train 6.808525 (lr=8.3502e-05) (hash(x)=25980380) +5519 train 6.556800 (lr=8.3478e-05) (hash(x)=23724957) +5520 train 6.368870 (lr=8.3453e-05) (hash(x)=22208575) +5521 train 6.337928 (lr=8.3429e-05) (hash(x)=21856644) +5522 train 6.706368 (lr=8.3404e-05) (hash(x)=24121651) +5523 train 6.831079 (lr=8.3380e-05) (hash(x)=25267537) +5524 train 6.681591 (lr=8.3356e-05) (hash(x)=25614807) +5525 train 7.172493 (lr=8.3331e-05) (hash(x)=29361370) +5526 train 6.967346 (lr=8.3307e-05) (hash(x)=28077422) +5527 train 6.801595 (lr=8.3282e-05) (hash(x)=23083514) +5528 train 6.861657 (lr=8.3258e-05) (hash(x)=26412620) +5529 train 6.625701 (lr=8.3234e-05) (hash(x)=23833787) +5530 train 6.719677 (lr=8.3209e-05) (hash(x)=23874525) +5531 train 6.704685 (lr=8.3185e-05) (hash(x)=24396585) +5532 train 6.502557 (lr=8.3160e-05) (hash(x)=21817470) +5533 train 6.755927 (lr=8.3136e-05) (hash(x)=25984999) +5534 train 6.637992 (lr=8.3112e-05) (hash(x)=21877013) +5535 train 6.099526 (lr=8.3087e-05) (hash(x)=16016924) +5536 train 6.609548 (lr=8.3063e-05) (hash(x)=21730198) +5537 train 6.881958 (lr=8.3038e-05) (hash(x)=26986291) +5538 train 7.061148 (lr=8.3014e-05) (hash(x)=27321141) +5539 train 6.962801 (lr=8.2990e-05) (hash(x)=28879986) +5540 train 7.106337 (lr=8.2965e-05) (hash(x)=31352487) +5541 train 6.856023 (lr=8.2941e-05) (hash(x)=27981347) +5542 train 6.720764 (lr=8.2916e-05) (hash(x)=25561437) +5543 train 6.872509 (lr=8.2892e-05) (hash(x)=27173674) +5544 train 6.458302 (lr=8.2868e-05) (hash(x)=20400516) +5545 train 6.571527 (lr=8.2843e-05) (hash(x)=22205514) +5546 train 6.366554 (lr=8.2819e-05) (hash(x)=21485231) +5547 train 6.552059 (lr=8.2795e-05) (hash(x)=22231485) +5548 train 6.547881 (lr=8.2770e-05) (hash(x)=21915469) +5549 train 6.702114 (lr=8.2746e-05) (hash(x)=22986074) +5550 val loss 6.7582 +5550 val perplexity 861.0877 +5550 train 6.918360 (lr=8.2721e-05) (hash(x)=26423407) +5551 train 7.177637 (lr=8.2697e-05) (hash(x)=28056250) +5552 train 7.151304 (lr=8.2673e-05) (hash(x)=29799119) +5553 train 6.923215 (lr=8.2648e-05) (hash(x)=24387849) +5554 train 6.905099 (lr=8.2624e-05) (hash(x)=27942752) +5555 train 6.718675 (lr=8.2600e-05) (hash(x)=23755137) +5556 train 6.632587 (lr=8.2575e-05) (hash(x)=23100189) +5557 train 6.601135 (lr=8.2551e-05) (hash(x)=20487254) +5558 train 6.899127 (lr=8.2526e-05) (hash(x)=25973375) +5559 train 6.552034 (lr=8.2502e-05) (hash(x)=22233617) +5560 train 6.795923 (lr=8.2478e-05) (hash(x)=25968128) +5561 train 6.215412 (lr=8.2453e-05) (hash(x)=18599249) +5562 train 6.781425 (lr=8.2429e-05) (hash(x)=25811805) +5563 train 6.959369 (lr=8.2405e-05) (hash(x)=26090483) +5564 train 6.660217 (lr=8.2380e-05) (hash(x)=25327699) +5565 train 8.059344 (lr=8.2356e-05) (hash(x)=36705946) +5566 train 7.067386 (lr=8.2332e-05) (hash(x)=29142293) +5567 train 6.515654 (lr=8.2307e-05) (hash(x)=23777908) +5568 train 6.663925 (lr=8.2283e-05) (hash(x)=25336608) +5569 train 6.957376 (lr=8.2259e-05) (hash(x)=27222983) +5570 train 7.041710 (lr=8.2234e-05) (hash(x)=29024896) +5571 train 6.629699 (lr=8.2210e-05) (hash(x)=22709741) +5572 train 6.650201 (lr=8.2186e-05) (hash(x)=22996697) +5573 train 6.750814 (lr=8.2161e-05) (hash(x)=24900228) +5574 train 6.863702 (lr=8.2137e-05) (hash(x)=27122698) +5575 train 6.935917 (lr=8.2112e-05) (hash(x)=27842849) +5576 train 6.749761 (lr=8.2088e-05) (hash(x)=27900509) +5577 train 6.899980 (lr=8.2064e-05) (hash(x)=26932678) +5578 train 6.847363 (lr=8.2039e-05) (hash(x)=28488385) +5579 train 7.178633 (lr=8.2015e-05) (hash(x)=27855572) +5580 train 6.975050 (lr=8.1991e-05) (hash(x)=25477193) +5581 train 6.888826 (lr=8.1966e-05) (hash(x)=25188536) +5582 train 6.707208 (lr=8.1942e-05) (hash(x)=23234626) +5583 train 6.747613 (lr=8.1918e-05) (hash(x)=23711679) +5584 train 6.520406 (lr=8.1893e-05) (hash(x)=21522788) +5585 train 6.763567 (lr=8.1869e-05) (hash(x)=27589949) +5586 train 6.674794 (lr=8.1845e-05) (hash(x)=22735443) +5587 train 6.924495 (lr=8.1821e-05) (hash(x)=25543906) +5588 train 6.904967 (lr=8.1796e-05) (hash(x)=26533831) +5589 train 6.813309 (lr=8.1772e-05) (hash(x)=24766996) +5590 train 6.408195 (lr=8.1748e-05) (hash(x)=20609422) +5591 train 6.165576 (lr=8.1723e-05) (hash(x)=17204843) +5592 train 6.717644 (lr=8.1699e-05) (hash(x)=26518352) +5593 train 6.781876 (lr=8.1675e-05) (hash(x)=24751586) +5594 train 6.539938 (lr=8.1650e-05) (hash(x)=22459566) +5595 train 9.118697 (lr=8.1626e-05) (hash(x)=48147671) +5596 train 6.694744 (lr=8.1602e-05) (hash(x)=24875184) +5597 train 6.869714 (lr=8.1577e-05) (hash(x)=25435777) +5598 train 6.726688 (lr=8.1553e-05) (hash(x)=23559255) +5599 train 6.655282 (lr=8.1529e-05) (hash(x)=23909800) +5600 val loss 6.7625 +5600 val perplexity 864.7898 +5600 train 6.547328 (lr=8.1504e-05) (hash(x)=22696140) +5601 train 6.942243 (lr=8.1480e-05) (hash(x)=28988340) +5602 train 6.746855 (lr=8.1456e-05) (hash(x)=26908897) +5603 train 6.854511 (lr=8.1432e-05) (hash(x)=24704097) +5604 train 6.943724 (lr=8.1407e-05) (hash(x)=28705642) +5605 train 6.607710 (lr=8.1383e-05) (hash(x)=23610257) +5606 train 6.702293 (lr=8.1359e-05) (hash(x)=23248994) +5607 train 7.042466 (lr=8.1334e-05) (hash(x)=25033286) +5608 train 7.203836 (lr=8.1310e-05) (hash(x)=30158584) +5609 train 7.678651 (lr=8.1286e-05) (hash(x)=28352541) +5610 train 7.990192 (lr=8.1261e-05) (hash(x)=29775655) +5611 train 6.807556 (lr=8.1237e-05) (hash(x)=24783577) +5612 train 6.893526 (lr=8.1213e-05) (hash(x)=28279673) +5613 train 7.027267 (lr=8.1189e-05) (hash(x)=24188526) +5614 train 6.800878 (lr=8.1164e-05) (hash(x)=25048310) +5615 train 6.675494 (lr=8.1140e-05) (hash(x)=23608371) +5616 train 7.077130 (lr=8.1116e-05) (hash(x)=28765833) +5617 train 7.026441 (lr=8.1091e-05) (hash(x)=24600812) +5618 train 6.640411 (lr=8.1067e-05) (hash(x)=24101293) +5619 train 6.880435 (lr=8.1043e-05) (hash(x)=25216084) +5620 train 6.781366 (lr=8.1019e-05) (hash(x)=23642110) +5621 train 6.864632 (lr=8.0994e-05) (hash(x)=25556167) +5622 train 7.360252 (lr=8.0970e-05) (hash(x)=29343276) +5623 train 6.855218 (lr=8.0946e-05) (hash(x)=23654625) +5624 train 6.790656 (lr=8.0922e-05) (hash(x)=27083661) +5625 train 6.906291 (lr=8.0897e-05) (hash(x)=25727830) +5626 train 6.725565 (lr=8.0873e-05) (hash(x)=26134786) +5627 train 6.759465 (lr=8.0849e-05) (hash(x)=25503100) +5628 train 6.586694 (lr=8.0824e-05) (hash(x)=24124654) +5629 train 6.573095 (lr=8.0800e-05) (hash(x)=23760249) +5630 train 6.712552 (lr=8.0776e-05) (hash(x)=24987030) +5631 train 6.842964 (lr=8.0752e-05) (hash(x)=22633313) +5632 train 6.772363 (lr=8.0727e-05) (hash(x)=25230230) +5633 train 7.046413 (lr=8.0703e-05) (hash(x)=26833493) +5634 train 6.836974 (lr=8.0679e-05) (hash(x)=25251986) +5635 train 6.816998 (lr=8.0655e-05) (hash(x)=27176235) +5636 train 6.613065 (lr=8.0630e-05) (hash(x)=23859809) +5637 train 6.976302 (lr=8.0606e-05) (hash(x)=27322950) +5638 train 6.571976 (lr=8.0582e-05) (hash(x)=22771925) +5639 train 6.714149 (lr=8.0558e-05) (hash(x)=24267011) +5640 train 7.117325 (lr=8.0533e-05) (hash(x)=28035033) +5641 train 6.813698 (lr=8.0509e-05) (hash(x)=26296064) +5642 train 6.474618 (lr=8.0485e-05) (hash(x)=20889800) +5643 train 6.514001 (lr=8.0461e-05) (hash(x)=21370796) +5644 train 6.707162 (lr=8.0436e-05) (hash(x)=23539685) +5645 train 7.105974 (lr=8.0412e-05) (hash(x)=28375028) +5646 train 6.619444 (lr=8.0388e-05) (hash(x)=23287498) +5647 train 6.573822 (lr=8.0364e-05) (hash(x)=23449416) +5648 train 6.651000 (lr=8.0340e-05) (hash(x)=24650331) +5649 train 6.932401 (lr=8.0315e-05) (hash(x)=25969848) +5650 val loss 6.7492 +5650 val perplexity 853.3740 +5650 train 6.781743 (lr=8.0291e-05) (hash(x)=26316896) +5651 train 7.146057 (lr=8.0267e-05) (hash(x)=26968187) +5652 train 7.285948 (lr=8.0243e-05) (hash(x)=28230305) +5653 train 7.149176 (lr=8.0218e-05) (hash(x)=27436973) +5654 train 7.061443 (lr=8.0194e-05) (hash(x)=25969554) +5655 train 7.058300 (lr=8.0170e-05) (hash(x)=28527906) +5656 train 6.758926 (lr=8.0146e-05) (hash(x)=22984439) +5657 train 6.832776 (lr=8.0121e-05) (hash(x)=23594458) +5658 train 6.564486 (lr=8.0097e-05) (hash(x)=21503183) +5659 train 6.668923 (lr=8.0073e-05) (hash(x)=21982691) +5660 train 6.899278 (lr=8.0049e-05) (hash(x)=26037102) +5661 train 6.581882 (lr=8.0025e-05) (hash(x)=25289815) +5662 train 6.788231 (lr=8.0000e-05) (hash(x)=22400394) +5663 train 6.521751 (lr=7.9976e-05) (hash(x)=21189075) +5664 train 6.531887 (lr=7.9952e-05) (hash(x)=22653032) +5665 train 6.574560 (lr=7.9928e-05) (hash(x)=22445556) +5666 train 6.665541 (lr=7.9904e-05) (hash(x)=23514405) +5667 train 6.676318 (lr=7.9879e-05) (hash(x)=25354290) +5668 train 6.807796 (lr=7.9855e-05) (hash(x)=28556308) +5669 train 6.853100 (lr=7.9831e-05) (hash(x)=30706366) +5670 train 6.658532 (lr=7.9807e-05) (hash(x)=24436612) +5671 train 6.978691 (lr=7.9783e-05) (hash(x)=25278645) +5672 train 7.342096 (lr=7.9758e-05) (hash(x)=29900662) +5673 train 7.561307 (lr=7.9734e-05) (hash(x)=32797871) +5674 train 7.601524 (lr=7.9710e-05) (hash(x)=34459306) +5675 train 7.218844 (lr=7.9686e-05) (hash(x)=31347747) +5676 train 7.295648 (lr=7.9662e-05) (hash(x)=28679061) +5677 train 6.791342 (lr=7.9637e-05) (hash(x)=23537177) +5678 train 6.737674 (lr=7.9613e-05) (hash(x)=22202027) +5679 train 6.899925 (lr=7.9589e-05) (hash(x)=23654290) +5680 train 6.634217 (lr=7.9565e-05) (hash(x)=20411309) +5681 train 6.696379 (lr=7.9541e-05) (hash(x)=23183433) +5682 train 6.799377 (lr=7.9517e-05) (hash(x)=24997201) +5683 train 6.774779 (lr=7.9492e-05) (hash(x)=25683179) +5684 train 6.823653 (lr=7.9468e-05) (hash(x)=27287287) +5685 train 6.778989 (lr=7.9444e-05) (hash(x)=23378935) +5686 train 6.777965 (lr=7.9420e-05) (hash(x)=25672369) +5687 train 6.767910 (lr=7.9396e-05) (hash(x)=24571139) +5688 train 6.780295 (lr=7.9371e-05) (hash(x)=23792319) +5689 train 6.801865 (lr=7.9347e-05) (hash(x)=25663997) +5690 train 6.754492 (lr=7.9323e-05) (hash(x)=24860502) +5691 train 6.841713 (lr=7.9299e-05) (hash(x)=25012625) +5692 train 7.077863 (lr=7.9275e-05) (hash(x)=26175222) +5693 train 6.887155 (lr=7.9251e-05) (hash(x)=24984061) +5694 train 6.720532 (lr=7.9227e-05) (hash(x)=25330180) +5695 train 7.004965 (lr=7.9202e-05) (hash(x)=26203172) +5696 train 6.834700 (lr=7.9178e-05) (hash(x)=23142935) +5697 train 6.791326 (lr=7.9154e-05) (hash(x)=22817936) +5698 train 6.741410 (lr=7.9130e-05) (hash(x)=24609677) +5699 train 7.035175 (lr=7.9106e-05) (hash(x)=28259689) +5700 val loss 6.7684 +5700 val perplexity 869.9373 +5700 train 7.106973 (lr=7.9082e-05) (hash(x)=29709340) +5701 train 6.535245 (lr=7.9057e-05) (hash(x)=22454445) +5702 train 6.684054 (lr=7.9033e-05) (hash(x)=23470427) +5703 train 6.382756 (lr=7.9009e-05) (hash(x)=19623503) +5704 train 6.780708 (lr=7.8985e-05) (hash(x)=25365692) +5705 train 7.004888 (lr=7.8961e-05) (hash(x)=27559822) +5706 train 7.025258 (lr=7.8937e-05) (hash(x)=26765778) +5707 train 6.760106 (lr=7.8913e-05) (hash(x)=21925406) +5708 train 6.643950 (lr=7.8888e-05) (hash(x)=23748896) +5709 train 6.793678 (lr=7.8864e-05) (hash(x)=28415736) +5710 train 6.205655 (lr=7.8840e-05) (hash(x)=18478534) +5711 train 6.581403 (lr=7.8816e-05) (hash(x)=23970545) +5712 train 6.765993 (lr=7.8792e-05) (hash(x)=25339274) +5713 train 6.542746 (lr=7.8768e-05) (hash(x)=24222112) +5714 train 6.904524 (lr=7.8744e-05) (hash(x)=27697890) +5715 train 6.890022 (lr=7.8720e-05) (hash(x)=26075181) +5716 train 6.991802 (lr=7.8695e-05) (hash(x)=27430144) +5717 train 6.971670 (lr=7.8671e-05) (hash(x)=28695466) +5718 train 7.649181 (lr=7.8647e-05) (hash(x)=28322756) +5719 train 6.804241 (lr=7.8623e-05) (hash(x)=25724900) +5720 train 6.716295 (lr=7.8599e-05) (hash(x)=24091951) +5721 train 7.130802 (lr=7.8575e-05) (hash(x)=27577472) +5722 train 6.952374 (lr=7.8551e-05) (hash(x)=27011754) +5723 train 6.853590 (lr=7.8527e-05) (hash(x)=25450376) +5724 train 6.708627 (lr=7.8503e-05) (hash(x)=23368747) +5725 train 6.980096 (lr=7.8478e-05) (hash(x)=27632908) +5726 train 6.861922 (lr=7.8454e-05) (hash(x)=25946302) +5727 train 6.596628 (lr=7.8430e-05) (hash(x)=23245421) +5728 train 6.934280 (lr=7.8406e-05) (hash(x)=25365268) +5729 train 7.007065 (lr=7.8382e-05) (hash(x)=25708400) +5730 train 6.941960 (lr=7.8358e-05) (hash(x)=30724161) +5731 train 6.758341 (lr=7.8334e-05) (hash(x)=26868795) +5732 train 6.592479 (lr=7.8310e-05) (hash(x)=23227033) +5733 train 6.746457 (lr=7.8286e-05) (hash(x)=24631556) +5734 train 6.370605 (lr=7.8262e-05) (hash(x)=19919780) +5735 train 6.698135 (lr=7.8238e-05) (hash(x)=24087537) +5736 train 6.764034 (lr=7.8213e-05) (hash(x)=25505501) +5737 train 6.565242 (lr=7.8189e-05) (hash(x)=21207038) +5738 train 6.104246 (lr=7.8165e-05) (hash(x)=15245559) +5739 train 6.560083 (lr=7.8141e-05) (hash(x)=22792495) +5740 train 6.858063 (lr=7.8117e-05) (hash(x)=26073243) +5741 train 6.809637 (lr=7.8093e-05) (hash(x)=25409896) +5742 train 6.957153 (lr=7.8069e-05) (hash(x)=28537234) +5743 train 6.711044 (lr=7.8045e-05) (hash(x)=25549646) +5744 train 6.642452 (lr=7.8021e-05) (hash(x)=24189822) +5745 train 6.790210 (lr=7.7997e-05) (hash(x)=25413623) +5746 train 6.758987 (lr=7.7973e-05) (hash(x)=25525173) +5747 train 6.852482 (lr=7.7949e-05) (hash(x)=27281086) +5748 train 6.785326 (lr=7.7925e-05) (hash(x)=28098971) +5749 train 6.828117 (lr=7.7900e-05) (hash(x)=25711227) +5750 val loss 6.7532 +5750 val perplexity 856.8228 +5750 train 6.941152 (lr=7.7876e-05) (hash(x)=30335340) +5751 train 6.854985 (lr=7.7852e-05) (hash(x)=26406563) +5752 train 6.478808 (lr=7.7828e-05) (hash(x)=20828857) +5753 train 6.782996 (lr=7.7804e-05) (hash(x)=25407278) +5754 train 7.279509 (lr=7.7780e-05) (hash(x)=26587000) +5755 train 6.673110 (lr=7.7756e-05) (hash(x)=24171804) +5756 train 6.677877 (lr=7.7732e-05) (hash(x)=24666412) +5757 train 6.969124 (lr=7.7708e-05) (hash(x)=27612885) +5758 train 6.839677 (lr=7.7684e-05) (hash(x)=23238194) +5759 train 6.876149 (lr=7.7660e-05) (hash(x)=23972429) +5760 train 7.029501 (lr=7.7636e-05) (hash(x)=27640328) +5761 train 7.082110 (lr=7.7612e-05) (hash(x)=28743403) +5762 train 6.881167 (lr=7.7588e-05) (hash(x)=27096346) +5763 train 6.802810 (lr=7.7564e-05) (hash(x)=27360494) +5764 train 6.834692 (lr=7.7540e-05) (hash(x)=24955188) +5765 train 6.980800 (lr=7.7516e-05) (hash(x)=24859883) +5766 train 6.770841 (lr=7.7492e-05) (hash(x)=25016765) +5767 train 6.858556 (lr=7.7468e-05) (hash(x)=26378040) +5768 train 6.969643 (lr=7.7444e-05) (hash(x)=25969390) +5769 train 6.545894 (lr=7.7420e-05) (hash(x)=24744059) +5770 train 6.911163 (lr=7.7396e-05) (hash(x)=26922523) +5771 train 6.774622 (lr=7.7372e-05) (hash(x)=22806400) +5772 train 6.702698 (lr=7.7348e-05) (hash(x)=22073473) +5773 train 6.762222 (lr=7.7324e-05) (hash(x)=26899184) +5774 train 6.930432 (lr=7.7299e-05) (hash(x)=26317007) +5775 train 6.722405 (lr=7.7275e-05) (hash(x)=24618531) +5776 train 6.581261 (lr=7.7251e-05) (hash(x)=22931588) +5777 train 7.461469 (lr=7.7227e-05) (hash(x)=30193423) +5778 train 6.810140 (lr=7.7203e-05) (hash(x)=27935540) +5779 train 6.436209 (lr=7.7179e-05) (hash(x)=22365122) +5780 train 6.743750 (lr=7.7155e-05) (hash(x)=25986560) +5781 train 6.452182 (lr=7.7131e-05) (hash(x)=21689063) +5782 train 6.685553 (lr=7.7107e-05) (hash(x)=24451344) +5783 train 6.829579 (lr=7.7083e-05) (hash(x)=20135714) +5784 train 6.726818 (lr=7.7059e-05) (hash(x)=22474047) +5785 train 6.993881 (lr=7.7035e-05) (hash(x)=26104873) +5786 train 7.389283 (lr=7.7011e-05) (hash(x)=30461181) +5787 train 6.807112 (lr=7.6987e-05) (hash(x)=28352366) +5788 train 6.787262 (lr=7.6963e-05) (hash(x)=27086825) +5789 train 6.574933 (lr=7.6939e-05) (hash(x)=22710450) +5790 train 6.710147 (lr=7.6915e-05) (hash(x)=24903963) +5791 train 6.826997 (lr=7.6892e-05) (hash(x)=26490981) +5792 train 7.338470 (lr=7.6868e-05) (hash(x)=25486575) +5793 train 7.088044 (lr=7.6844e-05) (hash(x)=24864419) +5794 train 6.918178 (lr=7.6820e-05) (hash(x)=28083020) +5795 train 6.843332 (lr=7.6796e-05) (hash(x)=26473954) +5796 train 6.867130 (lr=7.6772e-05) (hash(x)=25614591) +5797 train 6.669031 (lr=7.6748e-05) (hash(x)=24326793) +5798 train 7.048642 (lr=7.6724e-05) (hash(x)=31511645) +5799 train 6.625762 (lr=7.6700e-05) (hash(x)=23927567) +5800 val loss 6.7491 +5800 val perplexity 853.2943 +5800 train 6.851493 (lr=7.6676e-05) (hash(x)=26273162) +5801 train 6.702566 (lr=7.6652e-05) (hash(x)=26191045) +5802 train 6.719997 (lr=7.6628e-05) (hash(x)=25529853) +5803 train 6.755159 (lr=7.6604e-05) (hash(x)=23353619) +5804 train 6.602757 (lr=7.6580e-05) (hash(x)=25222730) +5805 train 6.753565 (lr=7.6556e-05) (hash(x)=27188285) +5806 train 6.695590 (lr=7.6532e-05) (hash(x)=25442552) +5807 train 6.903729 (lr=7.6508e-05) (hash(x)=27943609) +5808 train 6.924062 (lr=7.6484e-05) (hash(x)=29273881) +5809 train 6.742291 (lr=7.6460e-05) (hash(x)=24274388) +5810 train 6.684427 (lr=7.6436e-05) (hash(x)=21577045) +5811 train 6.412811 (lr=7.6412e-05) (hash(x)=22453474) +5812 train 6.764372 (lr=7.6388e-05) (hash(x)=25379308) +5813 train 7.299197 (lr=7.6364e-05) (hash(x)=31469316) +5814 train 6.820058 (lr=7.6340e-05) (hash(x)=27666898) +5815 train 6.673551 (lr=7.6316e-05) (hash(x)=22962561) +5816 train 6.930358 (lr=7.6293e-05) (hash(x)=26659488) +5817 train 6.625146 (lr=7.6269e-05) (hash(x)=23332118) +5818 train 7.000892 (lr=7.6245e-05) (hash(x)=30374669) +5819 train 6.775052 (lr=7.6221e-05) (hash(x)=27351426) +5820 train 6.923297 (lr=7.6197e-05) (hash(x)=25241833) +5821 train 6.784788 (lr=7.6173e-05) (hash(x)=24699099) +5822 train 6.679583 (lr=7.6149e-05) (hash(x)=25889152) +5823 train 6.994821 (lr=7.6125e-05) (hash(x)=24772257) +5824 train 6.606875 (lr=7.6101e-05) (hash(x)=21187690) +5825 train 6.914224 (lr=7.6077e-05) (hash(x)=26831636) +5826 train 6.601569 (lr=7.6053e-05) (hash(x)=23586722) +5827 train 6.447441 (lr=7.6029e-05) (hash(x)=21308028) +5828 train 6.866263 (lr=7.6005e-05) (hash(x)=23918648) +5829 train 7.029453 (lr=7.5982e-05) (hash(x)=25064642) +5830 train 6.742702 (lr=7.5958e-05) (hash(x)=25457639) +5831 train 6.789898 (lr=7.5934e-05) (hash(x)=25539761) +5832 train 6.786453 (lr=7.5910e-05) (hash(x)=26755692) +5833 train 7.096978 (lr=7.5886e-05) (hash(x)=26926121) +5834 train 7.184804 (lr=7.5862e-05) (hash(x)=28206151) +5835 train 6.904080 (lr=7.5838e-05) (hash(x)=26855802) +5836 train 7.044017 (lr=7.5814e-05) (hash(x)=27908892) +5837 train 6.998695 (lr=7.5790e-05) (hash(x)=29472224) +5838 train 6.570723 (lr=7.5766e-05) (hash(x)=24362055) +5839 train 6.615617 (lr=7.5743e-05) (hash(x)=23316262) +5840 train 6.666992 (lr=7.5719e-05) (hash(x)=25211260) +5841 train 6.798492 (lr=7.5695e-05) (hash(x)=25576111) +5842 train 6.571870 (lr=7.5671e-05) (hash(x)=21936430) +5843 train 6.483102 (lr=7.5647e-05) (hash(x)=21271807) +5844 train 6.536750 (lr=7.5623e-05) (hash(x)=23499406) +5845 train 6.807054 (lr=7.5599e-05) (hash(x)=24542517) +5846 train 6.841548 (lr=7.5575e-05) (hash(x)=26133151) +5847 train 6.789255 (lr=7.5552e-05) (hash(x)=23857558) +5848 train 6.719162 (lr=7.5528e-05) (hash(x)=25847943) +5849 train 7.303195 (lr=7.5504e-05) (hash(x)=29686711) +5850 val loss 6.7442 +5850 val perplexity 849.1542 +5850 train 6.986072 (lr=7.5480e-05) (hash(x)=26432184) +5851 train 6.938257 (lr=7.5456e-05) (hash(x)=26381255) +5852 train 6.642330 (lr=7.5432e-05) (hash(x)=24189494) +5853 train 6.733267 (lr=7.5408e-05) (hash(x)=28105073) +5854 train 6.674586 (lr=7.5384e-05) (hash(x)=25926797) +5855 train 7.004807 (lr=7.5361e-05) (hash(x)=30252690) +5856 train 7.033140 (lr=7.5337e-05) (hash(x)=35140015) +5857 train 6.802080 (lr=7.5313e-05) (hash(x)=25872958) +5858 train 6.670247 (lr=7.5289e-05) (hash(x)=26168599) +5859 train 6.612790 (lr=7.5265e-05) (hash(x)=23502359) +5860 train 7.235108 (lr=7.5241e-05) (hash(x)=27926741) +5861 train 7.209812 (lr=7.5217e-05) (hash(x)=30656009) +5862 train 6.701717 (lr=7.5194e-05) (hash(x)=22968272) +5863 train 7.557466 (lr=7.5170e-05) (hash(x)=30590162) +5864 train 6.838745 (lr=7.5146e-05) (hash(x)=27016671) +5865 train 7.021903 (lr=7.5122e-05) (hash(x)=25210533) +5866 train 6.999584 (lr=7.5098e-05) (hash(x)=29820330) +5867 train 6.629241 (lr=7.5074e-05) (hash(x)=24592932) +5868 train 6.690899 (lr=7.5051e-05) (hash(x)=23509725) +5869 train 6.710496 (lr=7.5027e-05) (hash(x)=23603016) +5870 train 6.763348 (lr=7.5003e-05) (hash(x)=24515529) +5871 train 6.919867 (lr=7.4979e-05) (hash(x)=25015721) +5872 train 7.062160 (lr=7.4955e-05) (hash(x)=28098776) +5873 train 6.876769 (lr=7.4932e-05) (hash(x)=28132535) +5874 train 7.310811 (lr=7.4908e-05) (hash(x)=31861276) +5875 train 6.778574 (lr=7.4884e-05) (hash(x)=25131959) +5876 train 6.887018 (lr=7.4860e-05) (hash(x)=25775926) +5877 train 6.654340 (lr=7.4836e-05) (hash(x)=21056777) +5878 train 6.835735 (lr=7.4812e-05) (hash(x)=26606890) +5879 train 6.988219 (lr=7.4789e-05) (hash(x)=28639679) +5880 train 6.809082 (lr=7.4765e-05) (hash(x)=26185626) +5881 train 6.891767 (lr=7.4741e-05) (hash(x)=24674878) +5882 train 6.859828 (lr=7.4717e-05) (hash(x)=25104282) +5883 train 6.480780 (lr=7.4693e-05) (hash(x)=23994413) +5884 train 6.844945 (lr=7.4670e-05) (hash(x)=25973331) +5885 train 6.811657 (lr=7.4646e-05) (hash(x)=27715763) +5886 train 6.807522 (lr=7.4622e-05) (hash(x)=26634706) +5887 train 6.846031 (lr=7.4598e-05) (hash(x)=26199058) +5888 train 6.846820 (lr=7.4574e-05) (hash(x)=25510330) +5889 train 7.071919 (lr=7.4551e-05) (hash(x)=26984744) +5890 train 7.169118 (lr=7.4527e-05) (hash(x)=27912483) +5891 train 6.773422 (lr=7.4503e-05) (hash(x)=28292328) +5892 train 6.684065 (lr=7.4479e-05) (hash(x)=23939512) +5893 train 6.639386 (lr=7.4456e-05) (hash(x)=22399977) +5894 train 6.966221 (lr=7.4432e-05) (hash(x)=25993660) +5895 train 6.911766 (lr=7.4408e-05) (hash(x)=28907461) +5896 train 6.748529 (lr=7.4384e-05) (hash(x)=21188293) +5897 train 6.361009 (lr=7.4360e-05) (hash(x)=19675299) +5898 train 7.016867 (lr=7.4337e-05) (hash(x)=29440224) +5899 train 6.759085 (lr=7.4313e-05) (hash(x)=25827028) +5900 val loss 6.7668 +5900 val perplexity 868.5546 +5900 train 6.837895 (lr=7.4289e-05) (hash(x)=30635737) +5901 train 6.901427 (lr=7.4265e-05) (hash(x)=27871847) +5902 train 6.984863 (lr=7.4242e-05) (hash(x)=27427472) +5903 train 7.124261 (lr=7.4218e-05) (hash(x)=26466915) +5904 train 7.167929 (lr=7.4194e-05) (hash(x)=25845281) +5905 train 6.712271 (lr=7.4170e-05) (hash(x)=25495489) +5906 train 6.950735 (lr=7.4147e-05) (hash(x)=25734950) +5907 train 7.090353 (lr=7.4123e-05) (hash(x)=31790001) +5908 train 7.049562 (lr=7.4099e-05) (hash(x)=28873445) +5909 train 7.016983 (lr=7.4075e-05) (hash(x)=26613552) +5910 train 6.890358 (lr=7.4052e-05) (hash(x)=27974804) +5911 train 6.524709 (lr=7.4028e-05) (hash(x)=20332613) +5912 train 6.769673 (lr=7.4004e-05) (hash(x)=23800786) +5913 train 6.854105 (lr=7.3980e-05) (hash(x)=27031988) +5914 train 6.846111 (lr=7.3957e-05) (hash(x)=26887263) +5915 train 6.875945 (lr=7.3933e-05) (hash(x)=26669544) +5916 train 6.974242 (lr=7.3909e-05) (hash(x)=27018436) +5917 train 6.678337 (lr=7.3886e-05) (hash(x)=24124032) +5918 train 6.456813 (lr=7.3862e-05) (hash(x)=23724141) +5919 train 7.021938 (lr=7.3838e-05) (hash(x)=26766470) +5920 train 7.192800 (lr=7.3814e-05) (hash(x)=28707643) +5921 train 6.609590 (lr=7.3791e-05) (hash(x)=22993426) +5922 train 5.775745 (lr=7.3767e-05) (hash(x)=12463744) +5923 train 6.726114 (lr=7.3743e-05) (hash(x)=25199942) +5924 train 7.013460 (lr=7.3720e-05) (hash(x)=27722710) +5925 train 6.765102 (lr=7.3696e-05) (hash(x)=25162205) +5926 train 6.846948 (lr=7.3672e-05) (hash(x)=25433291) +5927 train 6.842110 (lr=7.3648e-05) (hash(x)=26722145) +5928 train 6.855958 (lr=7.3625e-05) (hash(x)=25851728) +5929 train 7.025162 (lr=7.3601e-05) (hash(x)=26409139) +5930 train 6.927719 (lr=7.3577e-05) (hash(x)=25557927) +5931 train 6.784290 (lr=7.3554e-05) (hash(x)=25974032) +5932 train 6.831502 (lr=7.3530e-05) (hash(x)=27058695) +5933 train 6.891120 (lr=7.3506e-05) (hash(x)=26149203) +5934 train 6.635621 (lr=7.3483e-05) (hash(x)=24330364) +5935 train 6.593649 (lr=7.3459e-05) (hash(x)=21222489) +5936 train 7.004874 (lr=7.3435e-05) (hash(x)=26877624) +5937 train 6.804489 (lr=7.3412e-05) (hash(x)=24867636) +5938 train 6.926898 (lr=7.3388e-05) (hash(x)=25373388) +5939 train 6.719570 (lr=7.3364e-05) (hash(x)=24233280) +5940 train 7.149077 (lr=7.3341e-05) (hash(x)=27167168) +5941 train 7.285167 (lr=7.3317e-05) (hash(x)=29172610) +5942 train 6.689482 (lr=7.3293e-05) (hash(x)=25076589) +5943 train 6.722241 (lr=7.3270e-05) (hash(x)=24662435) +5944 train 7.060192 (lr=7.3246e-05) (hash(x)=23449480) +5945 train 6.997798 (lr=7.3222e-05) (hash(x)=24363528) +5946 train 6.430356 (lr=7.3199e-05) (hash(x)=22901251) +5947 train 6.628842 (lr=7.3175e-05) (hash(x)=22803397) +5948 train 6.756666 (lr=7.3151e-05) (hash(x)=25096097) +5949 train 6.479759 (lr=7.3128e-05) (hash(x)=20510241) +5950 val loss 6.7492 +5950 val perplexity 853.3671 +5950 train 6.964746 (lr=7.3104e-05) (hash(x)=24979320) +5951 train 6.753395 (lr=7.3080e-05) (hash(x)=24308927) +5952 train 7.068074 (lr=7.3057e-05) (hash(x)=26729787) +5953 train 6.861726 (lr=7.3033e-05) (hash(x)=24909028) +5954 train 6.893541 (lr=7.3009e-05) (hash(x)=26835931) +5955 train 6.343139 (lr=7.2986e-05) (hash(x)=20018414) +5956 train 6.533084 (lr=7.2962e-05) (hash(x)=22502398) +5957 train 6.545239 (lr=7.2938e-05) (hash(x)=22885050) +5958 train 6.322642 (lr=7.2915e-05) (hash(x)=21886150) +5959 train 6.793485 (lr=7.2891e-05) (hash(x)=28442502) +5960 train 6.822193 (lr=7.2868e-05) (hash(x)=24422795) +5961 train 6.428365 (lr=7.2844e-05) (hash(x)=19111217) +5962 train 6.741100 (lr=7.2820e-05) (hash(x)=24683928) +5963 train 6.832817 (lr=7.2797e-05) (hash(x)=26005705) +5964 train 6.790151 (lr=7.2773e-05) (hash(x)=27105653) +5965 train 6.831166 (lr=7.2749e-05) (hash(x)=26355565) +5966 train 6.774501 (lr=7.2726e-05) (hash(x)=28748016) +5967 train 6.565619 (lr=7.2702e-05) (hash(x)=22810435) +5968 train 6.629612 (lr=7.2679e-05) (hash(x)=23292595) +5969 train 6.920513 (lr=7.2655e-05) (hash(x)=25613029) +5970 train 6.877253 (lr=7.2631e-05) (hash(x)=26732062) +5971 train 7.013725 (lr=7.2608e-05) (hash(x)=23706225) +5972 train 6.686502 (lr=7.2584e-05) (hash(x)=24982916) +5973 train 6.982754 (lr=7.2561e-05) (hash(x)=25469856) +5974 train 7.024626 (lr=7.2537e-05) (hash(x)=27992345) +5975 train 7.077898 (lr=7.2513e-05) (hash(x)=30486518) +5976 train 7.087981 (lr=7.2490e-05) (hash(x)=31798255) +5977 train 7.176349 (lr=7.2466e-05) (hash(x)=33354988) +5978 train 6.944139 (lr=7.2443e-05) (hash(x)=28593964) +5979 train 6.806275 (lr=7.2419e-05) (hash(x)=26566879) +5980 train 6.404751 (lr=7.2395e-05) (hash(x)=21317486) +5981 train 6.763462 (lr=7.2372e-05) (hash(x)=23919299) +5982 train 6.865097 (lr=7.2348e-05) (hash(x)=24123063) +5983 train 6.996465 (lr=7.2325e-05) (hash(x)=22688712) +5984 train 6.869093 (lr=7.2301e-05) (hash(x)=25925729) +5985 train 7.216444 (lr=7.2278e-05) (hash(x)=30642515) +5986 train 6.654639 (lr=7.2254e-05) (hash(x)=26388569) +5987 train 6.788614 (lr=7.2230e-05) (hash(x)=26847937) +5988 train 6.625792 (lr=7.2207e-05) (hash(x)=23449653) +5989 train 6.699552 (lr=7.2183e-05) (hash(x)=24177890) +5990 train 6.658519 (lr=7.2160e-05) (hash(x)=23419881) +5991 train 6.523564 (lr=7.2136e-05) (hash(x)=20712962) +5992 train 6.711513 (lr=7.2113e-05) (hash(x)=24671023) +5993 train 6.876125 (lr=7.2089e-05) (hash(x)=24910994) +5994 train 6.552188 (lr=7.2066e-05) (hash(x)=20961144) +5995 train 5.954621 (lr=7.2042e-05) (hash(x)=13526184) +5996 train 6.491277 (lr=7.2018e-05) (hash(x)=21141112) +5997 train 6.398088 (lr=7.1995e-05) (hash(x)=22334600) +5998 train 6.863069 (lr=7.1971e-05) (hash(x)=27472803) +5999 train 7.028366 (lr=7.1948e-05) (hash(x)=27490086) +6000 val loss 6.7429 +6000 val perplexity 848.0483 +6000 train 6.600244 (lr=7.1924e-05) (hash(x)=22653477) +6001 train 6.370182 (lr=7.1901e-05) (hash(x)=21495031) +6002 train 6.690923 (lr=7.1877e-05) (hash(x)=27095460) +6003 train 6.687506 (lr=7.1854e-05) (hash(x)=25021203) +6004 train 6.605546 (lr=7.1830e-05) (hash(x)=24829139) +6005 train 6.686594 (lr=7.1807e-05) (hash(x)=25335474) +6006 train 6.711287 (lr=7.1783e-05) (hash(x)=26000289) +6007 train 6.611351 (lr=7.1760e-05) (hash(x)=23973908) +6008 train 6.700113 (lr=7.1736e-05) (hash(x)=26975306) +6009 train 6.571054 (lr=7.1713e-05) (hash(x)=21568359) +6010 train 6.663641 (lr=7.1689e-05) (hash(x)=22760009) +6011 train 6.714217 (lr=7.1666e-05) (hash(x)=24588031) +6012 train 6.772915 (lr=7.1642e-05) (hash(x)=26644069) +6013 train 6.763800 (lr=7.1619e-05) (hash(x)=23607819) +6014 train 7.011137 (lr=7.1595e-05) (hash(x)=29445584) +6015 train 7.004474 (lr=7.1572e-05) (hash(x)=29132401) +6016 train 6.682677 (lr=7.1548e-05) (hash(x)=24606886) +6017 train 6.759783 (lr=7.1525e-05) (hash(x)=28736940) +6018 train 6.861856 (lr=7.1501e-05) (hash(x)=26640031) +6019 train 6.852708 (lr=7.1478e-05) (hash(x)=25773639) +6020 train 6.660483 (lr=7.1454e-05) (hash(x)=22620213) +6021 train 6.900246 (lr=7.1431e-05) (hash(x)=26493275) +6022 train 6.601905 (lr=7.1407e-05) (hash(x)=22747439) +6023 train 6.870439 (lr=7.1384e-05) (hash(x)=27386700) +6024 train 7.327838 (lr=7.1360e-05) (hash(x)=36749567) +6025 train 6.979054 (lr=7.1337e-05) (hash(x)=29149408) +6026 train 6.469392 (lr=7.1313e-05) (hash(x)=22669052) +6027 train 6.687429 (lr=7.1290e-05) (hash(x)=25032643) +6028 train 6.566757 (lr=7.1266e-05) (hash(x)=24928329) +6029 train 6.857366 (lr=7.1243e-05) (hash(x)=25351040) +6030 train 6.932189 (lr=7.1219e-05) (hash(x)=23381257) +6031 train 6.645975 (lr=7.1196e-05) (hash(x)=24268614) +6032 train 6.882330 (lr=7.1173e-05) (hash(x)=27077927) +6033 train 6.853475 (lr=7.1149e-05) (hash(x)=26542132) +6034 train 6.898323 (lr=7.1126e-05) (hash(x)=27252181) +6035 train 6.901428 (lr=7.1102e-05) (hash(x)=27673003) +6036 train 6.947325 (lr=7.1079e-05) (hash(x)=26186255) +6037 train 6.824005 (lr=7.1055e-05) (hash(x)=26038620) +6038 train 6.840657 (lr=7.1032e-05) (hash(x)=24912758) +6039 train 6.757512 (lr=7.1008e-05) (hash(x)=27378387) +6040 train 6.574413 (lr=7.0985e-05) (hash(x)=22937541) +6041 train 6.789797 (lr=7.0962e-05) (hash(x)=24974861) +6042 train 6.447690 (lr=7.0938e-05) (hash(x)=21201237) +6043 train 6.756597 (lr=7.0915e-05) (hash(x)=24801098) +6044 train 6.669254 (lr=7.0891e-05) (hash(x)=24774812) +6045 train 6.591078 (lr=7.0868e-05) (hash(x)=23464631) +6046 train 6.669991 (lr=7.0844e-05) (hash(x)=23063986) +6047 train 6.622223 (lr=7.0821e-05) (hash(x)=22529400) +6048 train 6.548576 (lr=7.0798e-05) (hash(x)=20813689) +6049 train 6.510549 (lr=7.0774e-05) (hash(x)=22151422) +6050 val loss 6.7446 +6050 val perplexity 849.4526 +6050 train 6.755458 (lr=7.0751e-05) (hash(x)=24198253) +6051 train 6.520357 (lr=7.0727e-05) (hash(x)=22008715) +6052 train 6.408850 (lr=7.0704e-05) (hash(x)=21805152) +6053 train 7.310297 (lr=7.0681e-05) (hash(x)=28440666) +6054 train 6.977907 (lr=7.0657e-05) (hash(x)=24451326) +6055 train 6.750200 (lr=7.0634e-05) (hash(x)=27586989) +6056 train 7.003415 (lr=7.0610e-05) (hash(x)=26291723) +6057 train 6.557022 (lr=7.0587e-05) (hash(x)=21902541) +6058 train 6.561477 (lr=7.0564e-05) (hash(x)=23355166) +6059 train 6.754514 (lr=7.0540e-05) (hash(x)=23439588) +6060 train 6.819782 (lr=7.0517e-05) (hash(x)=25254823) +6061 train 6.529953 (lr=7.0493e-05) (hash(x)=21943405) +6062 train 6.579486 (lr=7.0470e-05) (hash(x)=23512022) +6063 train 6.604787 (lr=7.0447e-05) (hash(x)=22336349) +6064 train 6.783370 (lr=7.0423e-05) (hash(x)=23924738) +6065 train 7.044293 (lr=7.0400e-05) (hash(x)=25645313) +6066 train 6.455806 (lr=7.0377e-05) (hash(x)=19342879) +6067 train 6.603348 (lr=7.0353e-05) (hash(x)=22235357) +6068 train 6.917061 (lr=7.0330e-05) (hash(x)=24999816) +6069 train 6.403961 (lr=7.0306e-05) (hash(x)=22710523) +6070 train 6.813107 (lr=7.0283e-05) (hash(x)=24059845) +6071 train 6.785062 (lr=7.0260e-05) (hash(x)=26147854) +6072 train 6.830751 (lr=7.0236e-05) (hash(x)=25432359) +6073 train 6.453006 (lr=7.0213e-05) (hash(x)=21375006) +6074 train 6.892781 (lr=7.0190e-05) (hash(x)=24050414) +6075 train 6.939407 (lr=7.0166e-05) (hash(x)=28013003) +6076 train 6.935039 (lr=7.0143e-05) (hash(x)=25292790) +6077 train 6.708241 (lr=7.0120e-05) (hash(x)=27062804) +6078 train 6.782913 (lr=7.0096e-05) (hash(x)=25803090) +6079 train 6.807561 (lr=7.0073e-05) (hash(x)=25346788) +6080 train 6.690573 (lr=7.0050e-05) (hash(x)=23701990) +6081 train 6.469120 (lr=7.0026e-05) (hash(x)=24661327) +6082 train 6.695337 (lr=7.0003e-05) (hash(x)=26003378) +6083 train 6.990705 (lr=6.9980e-05) (hash(x)=29551719) +6084 train 6.664030 (lr=6.9956e-05) (hash(x)=23882545) +6085 train 7.338400 (lr=6.9933e-05) (hash(x)=34784102) +6086 train 7.230979 (lr=6.9910e-05) (hash(x)=33914228) +6087 train 6.744937 (lr=6.9886e-05) (hash(x)=25956855) +6088 train 6.565371 (lr=6.9863e-05) (hash(x)=24387359) +6089 train 6.580453 (lr=6.9840e-05) (hash(x)=22047289) +6090 train 6.594273 (lr=6.9816e-05) (hash(x)=20761061) +6091 train 7.234431 (lr=6.9793e-05) (hash(x)=28873527) +6092 train 6.947109 (lr=6.9770e-05) (hash(x)=24916311) +6093 train 6.706350 (lr=6.9746e-05) (hash(x)=25117562) +6094 train 7.149683 (lr=6.9723e-05) (hash(x)=27330012) +6095 train 6.638904 (lr=6.9700e-05) (hash(x)=24367780) +6096 train 6.469069 (lr=6.9677e-05) (hash(x)=19618213) +6097 train 6.624074 (lr=6.9653e-05) (hash(x)=24831846) +6098 train 6.436165 (lr=6.9630e-05) (hash(x)=21831445) +6099 train 7.186293 (lr=6.9607e-05) (hash(x)=27682151) +6100 val loss 6.7373 +6100 val perplexity 843.3173 +6100 train 6.840718 (lr=6.9583e-05) (hash(x)=22944153) +6101 train 6.700797 (lr=6.9560e-05) (hash(x)=22223775) +6102 train 6.758475 (lr=6.9537e-05) (hash(x)=21861379) +6103 train 6.644552 (lr=6.9514e-05) (hash(x)=26084462) +6104 train 6.913630 (lr=6.9490e-05) (hash(x)=28752077) +6105 train 6.811162 (lr=6.9467e-05) (hash(x)=29273202) +6106 train 6.662103 (lr=6.9444e-05) (hash(x)=23643447) +6107 train 6.895482 (lr=6.9421e-05) (hash(x)=24782887) +6108 train 6.801342 (lr=6.9397e-05) (hash(x)=24344894) +6109 train 6.416261 (lr=6.9374e-05) (hash(x)=20434348) +6110 train 6.753206 (lr=6.9351e-05) (hash(x)=28910914) +6111 train 6.790034 (lr=6.9328e-05) (hash(x)=26702459) +6112 train 6.716129 (lr=6.9304e-05) (hash(x)=26062298) +6113 train 6.656215 (lr=6.9281e-05) (hash(x)=26194884) +6114 train 6.647952 (lr=6.9258e-05) (hash(x)=24259367) +6115 train 6.715721 (lr=6.9235e-05) (hash(x)=25413684) +6116 train 6.872312 (lr=6.9211e-05) (hash(x)=28048569) +6117 train 6.746395 (lr=6.9188e-05) (hash(x)=23691848) +6118 train 6.556442 (lr=6.9165e-05) (hash(x)=21878136) +6119 train 6.824774 (lr=6.9142e-05) (hash(x)=25717976) +6120 train 6.721869 (lr=6.9118e-05) (hash(x)=26912572) +6121 train 6.635098 (lr=6.9095e-05) (hash(x)=25634206) +6122 train 6.608047 (lr=6.9072e-05) (hash(x)=24361949) +6123 train 6.410970 (lr=6.9049e-05) (hash(x)=20092522) +6124 train 6.899871 (lr=6.9025e-05) (hash(x)=27393812) +6125 train 6.558434 (lr=6.9002e-05) (hash(x)=24098395) +6126 train 6.728714 (lr=6.8979e-05) (hash(x)=24652789) +6127 train 6.451136 (lr=6.8956e-05) (hash(x)=22141366) +6128 train 6.872462 (lr=6.8933e-05) (hash(x)=26547234) +6129 train 6.948061 (lr=6.8909e-05) (hash(x)=25195782) +6130 train 7.108571 (lr=6.8886e-05) (hash(x)=27990769) +6131 train 6.743523 (lr=6.8863e-05) (hash(x)=25655198) +6132 train 7.003025 (lr=6.8840e-05) (hash(x)=24909000) +6133 train 6.518723 (lr=6.8817e-05) (hash(x)=23104704) +6134 train 6.987656 (lr=6.8793e-05) (hash(x)=28627058) +6135 train 6.650565 (lr=6.8770e-05) (hash(x)=24652423) +6136 train 6.690285 (lr=6.8747e-05) (hash(x)=23333494) +6137 train 6.829488 (lr=6.8724e-05) (hash(x)=26098808) +6138 train 6.687454 (lr=6.8701e-05) (hash(x)=22606379) +6139 train 6.689163 (lr=6.8678e-05) (hash(x)=24387630) +6140 train 6.603149 (lr=6.8654e-05) (hash(x)=23603821) +6141 train 7.001419 (lr=6.8631e-05) (hash(x)=25565362) +6142 train 7.000793 (lr=6.8608e-05) (hash(x)=30725951) +6143 train 7.080167 (lr=6.8585e-05) (hash(x)=30911699) +6144 train 6.974181 (lr=6.8562e-05) (hash(x)=28792940) +6145 train 6.498325 (lr=6.8539e-05) (hash(x)=23108416) +6146 train 6.503929 (lr=6.8515e-05) (hash(x)=21634360) +6147 train 6.719827 (lr=6.8492e-05) (hash(x)=25683298) +6148 train 7.264926 (lr=6.8469e-05) (hash(x)=27010095) +6149 train 6.613451 (lr=6.8446e-05) (hash(x)=25035622) +6150 val loss 6.7283 +6150 val perplexity 835.7473 +6150 train 6.881063 (lr=6.8423e-05) (hash(x)=27354843) +6151 train 6.721745 (lr=6.8400e-05) (hash(x)=22076954) +6152 train 6.519229 (lr=6.8376e-05) (hash(x)=22778170) +6153 train 6.578804 (lr=6.8353e-05) (hash(x)=25936067) +6154 train 7.063388 (lr=6.8330e-05) (hash(x)=25757017) +6155 train 7.436540 (lr=6.8307e-05) (hash(x)=31181390) +6156 train 7.353550 (lr=6.8284e-05) (hash(x)=28478586) +6157 train 7.164531 (lr=6.8261e-05) (hash(x)=30427728) +6158 train 6.983534 (lr=6.8238e-05) (hash(x)=27821171) +6159 train 6.557165 (lr=6.8215e-05) (hash(x)=21586769) +6160 train 7.260522 (lr=6.8191e-05) (hash(x)=36460723) +6161 train 7.202773 (lr=6.8168e-05) (hash(x)=34422021) +6162 train 6.574089 (lr=6.8145e-05) (hash(x)=23380744) +6163 train 6.525200 (lr=6.8122e-05) (hash(x)=23624698) +6164 train 6.584047 (lr=6.8099e-05) (hash(x)=21721549) +6165 train 6.806507 (lr=6.8076e-05) (hash(x)=26759098) +6166 train 6.980251 (lr=6.8053e-05) (hash(x)=24678698) +6167 train 6.509882 (lr=6.8030e-05) (hash(x)=21994337) +6168 train 6.715327 (lr=6.8007e-05) (hash(x)=23156995) +6169 train 6.417404 (lr=6.7983e-05) (hash(x)=22673785) +6170 train 6.942349 (lr=6.7960e-05) (hash(x)=27902392) +6171 train 6.933713 (lr=6.7937e-05) (hash(x)=28469977) +6172 train 6.679043 (lr=6.7914e-05) (hash(x)=24716853) +6173 train 6.727211 (lr=6.7891e-05) (hash(x)=24847065) +6174 train 6.787969 (lr=6.7868e-05) (hash(x)=25196610) +6175 train 6.840582 (lr=6.7845e-05) (hash(x)=25454145) +6176 train 6.604665 (lr=6.7822e-05) (hash(x)=27374959) +6177 train 6.727921 (lr=6.7799e-05) (hash(x)=26065968) +6178 train 6.448128 (lr=6.7776e-05) (hash(x)=21082196) +6179 train 6.808669 (lr=6.7753e-05) (hash(x)=21129257) +6180 train 6.848221 (lr=6.7730e-05) (hash(x)=23571253) +6181 train 7.092178 (lr=6.7707e-05) (hash(x)=30436197) +6182 train 6.905426 (lr=6.7684e-05) (hash(x)=19236457) +6183 train 7.034374 (lr=6.7660e-05) (hash(x)=23239550) +6184 train 7.044525 (lr=6.7637e-05) (hash(x)=27503777) +6185 train 7.264349 (lr=6.7614e-05) (hash(x)=26579905) +6186 train 7.040818 (lr=6.7591e-05) (hash(x)=27244782) +6187 train 6.899329 (lr=6.7568e-05) (hash(x)=27585808) +6188 train 6.661195 (lr=6.7545e-05) (hash(x)=25367023) +6189 train 6.778680 (lr=6.7522e-05) (hash(x)=27227738) +6190 train 6.571091 (lr=6.7499e-05) (hash(x)=24972427) +6191 train 6.769026 (lr=6.7476e-05) (hash(x)=23565926) +6192 train 6.906073 (lr=6.7453e-05) (hash(x)=26296624) +6193 train 6.297252 (lr=6.7430e-05) (hash(x)=19742002) +6194 train 6.377191 (lr=6.7407e-05) (hash(x)=22264392) +6195 train 6.917311 (lr=6.7384e-05) (hash(x)=25975387) +6196 train 6.762851 (lr=6.7361e-05) (hash(x)=25404443) +6197 train 7.189889 (lr=6.7338e-05) (hash(x)=27889390) +6198 train 6.633894 (lr=6.7315e-05) (hash(x)=24869930) +6199 train 6.714467 (lr=6.7292e-05) (hash(x)=24705563) +6200 val loss 6.7556 +6200 val perplexity 858.8172 +6200 train 6.812641 (lr=6.7269e-05) (hash(x)=26587640) +6201 train 6.427730 (lr=6.7246e-05) (hash(x)=23338227) +6202 train 6.524831 (lr=6.7223e-05) (hash(x)=23895929) +6203 train 6.834175 (lr=6.7200e-05) (hash(x)=25184317) +6204 train 6.508203 (lr=6.7177e-05) (hash(x)=20824308) +6205 train 6.593323 (lr=6.7154e-05) (hash(x)=22183319) +6206 train 6.522138 (lr=6.7131e-05) (hash(x)=21547797) +6207 train 8.269240 (lr=6.7108e-05) (hash(x)=27671095) +6208 train 7.887664 (lr=6.7085e-05) (hash(x)=27417421) +6209 train 6.990594 (lr=6.7062e-05) (hash(x)=28244583) +6210 train 6.870158 (lr=6.7039e-05) (hash(x)=26413418) +6211 train 6.681470 (lr=6.7016e-05) (hash(x)=25646369) +6212 train 6.754157 (lr=6.6993e-05) (hash(x)=24195693) +6213 train 6.941432 (lr=6.6970e-05) (hash(x)=26879691) +6214 train 6.624207 (lr=6.6947e-05) (hash(x)=24829805) +6215 train 6.946915 (lr=6.6924e-05) (hash(x)=26254303) +6216 train 6.458109 (lr=6.6901e-05) (hash(x)=23524661) +6217 train 6.902368 (lr=6.6878e-05) (hash(x)=24095204) +6218 train 6.773026 (lr=6.6855e-05) (hash(x)=23807670) +6219 train 6.702383 (lr=6.6832e-05) (hash(x)=22812689) +6220 train 6.507877 (lr=6.6809e-05) (hash(x)=24273063) +6221 train 6.616876 (lr=6.6786e-05) (hash(x)=21647865) +6222 train 6.666538 (lr=6.6763e-05) (hash(x)=26480724) +6223 train 6.776297 (lr=6.6741e-05) (hash(x)=27454020) +6224 train 6.887741 (lr=6.6718e-05) (hash(x)=26441090) +6225 train 6.635654 (lr=6.6695e-05) (hash(x)=25030447) +6226 train 6.854871 (lr=6.6672e-05) (hash(x)=29009006) +6227 train 6.556744 (lr=6.6649e-05) (hash(x)=24788080) +6228 train 6.740322 (lr=6.6626e-05) (hash(x)=24267336) +6229 train 6.516491 (lr=6.6603e-05) (hash(x)=21735476) +6230 train 6.579247 (lr=6.6580e-05) (hash(x)=23662660) +6231 train 6.644578 (lr=6.6557e-05) (hash(x)=24394565) +6232 train 6.470817 (lr=6.6534e-05) (hash(x)=21971162) +6233 train 6.645883 (lr=6.6511e-05) (hash(x)=24642575) +6234 train 6.577460 (lr=6.6488e-05) (hash(x)=23150196) +6235 train 6.587026 (lr=6.6465e-05) (hash(x)=23961786) +6236 train 6.607925 (lr=6.6443e-05) (hash(x)=25190457) +6237 train 6.567735 (lr=6.6420e-05) (hash(x)=21408799) +6238 train 6.586014 (lr=6.6397e-05) (hash(x)=23967136) +6239 train 6.709983 (lr=6.6374e-05) (hash(x)=21780199) +6240 train 6.906898 (lr=6.6351e-05) (hash(x)=28920108) +6241 train 6.467752 (lr=6.6328e-05) (hash(x)=21526613) +6242 train 6.784834 (lr=6.6305e-05) (hash(x)=26215200) +6243 train 6.730505 (lr=6.6282e-05) (hash(x)=24418202) +6244 train 6.629341 (lr=6.6259e-05) (hash(x)=22692596) +6245 train 6.453846 (lr=6.6237e-05) (hash(x)=21109230) +6246 train 6.782561 (lr=6.6214e-05) (hash(x)=24863993) +6247 train 6.941719 (lr=6.6191e-05) (hash(x)=28296896) +6248 train 6.871745 (lr=6.6168e-05) (hash(x)=26511972) +6249 train 6.967212 (lr=6.6145e-05) (hash(x)=27248343) +6250 val loss 6.7370 +6250 val perplexity 843.0636 +6250 train 6.597157 (lr=6.6122e-05) (hash(x)=24413241) +6251 train 6.533061 (lr=6.6099e-05) (hash(x)=21091322) +6252 train 6.592903 (lr=6.6077e-05) (hash(x)=23691442) +6253 train 7.295590 (lr=6.6054e-05) (hash(x)=34998924) +6254 train 7.431653 (lr=6.6031e-05) (hash(x)=37561175) +6255 train 6.648251 (lr=6.6008e-05) (hash(x)=26766303) +6256 train 6.670591 (lr=6.5985e-05) (hash(x)=25829123) +6257 train 6.892593 (lr=6.5962e-05) (hash(x)=24526029) +6258 train 6.600794 (lr=6.5939e-05) (hash(x)=23935935) +6259 train 6.847135 (lr=6.5917e-05) (hash(x)=26470612) +6260 train 6.735092 (lr=6.5894e-05) (hash(x)=25188053) +6261 train 6.764690 (lr=6.5871e-05) (hash(x)=25031689) +6262 train 6.832376 (lr=6.5848e-05) (hash(x)=28886310) +6263 train 6.435919 (lr=6.5825e-05) (hash(x)=21599973) +6264 train 7.308557 (lr=6.5803e-05) (hash(x)=36259930) +6265 train 7.402907 (lr=6.5780e-05) (hash(x)=36255638) +6266 train 6.950125 (lr=6.5757e-05) (hash(x)=28538692) +6267 train 6.990514 (lr=6.5734e-05) (hash(x)=31207925) +6268 train 6.813657 (lr=6.5711e-05) (hash(x)=27022990) +6269 train 6.900206 (lr=6.5688e-05) (hash(x)=22962349) +6270 train 6.680608 (lr=6.5666e-05) (hash(x)=24062225) +6271 train 6.888714 (lr=6.5643e-05) (hash(x)=24969360) +6272 train 6.450805 (lr=6.5620e-05) (hash(x)=20717122) +6273 train 6.499159 (lr=6.5597e-05) (hash(x)=21506615) +6274 train 8.171073 (lr=6.5574e-05) (hash(x)=37152718) +6275 train 8.530334 (lr=6.5552e-05) (hash(x)=41298231) +6276 train 6.446312 (lr=6.5529e-05) (hash(x)=20561744) +6277 train 6.641902 (lr=6.5506e-05) (hash(x)=23851179) +6278 train 6.737724 (lr=6.5483e-05) (hash(x)=25012126) +6279 train 6.566926 (lr=6.5461e-05) (hash(x)=24382006) +6280 train 6.824311 (lr=6.5438e-05) (hash(x)=23884271) +6281 train 6.695795 (lr=6.5415e-05) (hash(x)=25856060) +6282 train 6.367767 (lr=6.5392e-05) (hash(x)=22415250) +6283 train 6.547745 (lr=6.5369e-05) (hash(x)=23267882) +6284 train 7.036121 (lr=6.5347e-05) (hash(x)=25865829) +6285 train 6.639879 (lr=6.5324e-05) (hash(x)=21416998) +6286 train 6.574090 (lr=6.5301e-05) (hash(x)=24791174) +6287 train 6.399467 (lr=6.5278e-05) (hash(x)=22009299) +6288 train 6.295324 (lr=6.5256e-05) (hash(x)=19101882) +6289 train 6.021877 (lr=6.5233e-05) (hash(x)=14030305) +6290 train 6.468733 (lr=6.5210e-05) (hash(x)=23503804) +6291 train 6.534112 (lr=6.5188e-05) (hash(x)=23980457) +6292 train 6.494457 (lr=6.5165e-05) (hash(x)=23138374) +6293 train 6.639366 (lr=6.5142e-05) (hash(x)=23808351) +6294 train 6.700841 (lr=6.5119e-05) (hash(x)=26804597) +6295 train 6.444360 (lr=6.5097e-05) (hash(x)=22376569) +6296 train 6.744777 (lr=6.5074e-05) (hash(x)=24434330) +6297 train 6.552177 (lr=6.5051e-05) (hash(x)=25235353) +6298 train 6.693433 (lr=6.5028e-05) (hash(x)=23327595) +6299 train 6.729156 (lr=6.5006e-05) (hash(x)=25511406) +6300 val loss 6.7322 +6300 val perplexity 839.0087 +6300 train 6.568425 (lr=6.4983e-05) (hash(x)=26780478) +6301 train 6.472635 (lr=6.4960e-05) (hash(x)=24295759) +6302 train 6.577579 (lr=6.4938e-05) (hash(x)=22768628) +6303 train 6.803293 (lr=6.4915e-05) (hash(x)=28166843) +6304 train 6.818007 (lr=6.4892e-05) (hash(x)=26391720) +6305 train 6.768917 (lr=6.4870e-05) (hash(x)=26005029) +6306 train 6.837994 (lr=6.4847e-05) (hash(x)=26340134) +6307 train 6.699667 (lr=6.4824e-05) (hash(x)=25581630) +6308 train 6.641735 (lr=6.4801e-05) (hash(x)=23327090) +6309 train 6.861694 (lr=6.4779e-05) (hash(x)=26068290) +6310 train 7.354572 (lr=6.4756e-05) (hash(x)=27158743) +6311 train 7.714587 (lr=6.4733e-05) (hash(x)=28230119) +6312 train 7.426974 (lr=6.4711e-05) (hash(x)=27663872) +6313 train 6.530832 (lr=6.4688e-05) (hash(x)=24497579) +6314 train 6.844416 (lr=6.4665e-05) (hash(x)=25474297) +6315 train 6.803630 (lr=6.4643e-05) (hash(x)=26479441) +6316 train 7.063251 (lr=6.4620e-05) (hash(x)=31243486) +6317 train 6.777951 (lr=6.4597e-05) (hash(x)=23940105) +6318 train 6.922779 (lr=6.4575e-05) (hash(x)=27137492) +6319 train 6.762177 (lr=6.4552e-05) (hash(x)=26207465) +6320 train 7.413354 (lr=6.4529e-05) (hash(x)=30769375) +6321 train 7.393456 (lr=6.4507e-05) (hash(x)=34020077) +6322 train 7.291429 (lr=6.4484e-05) (hash(x)=36643265) +6323 train 6.720346 (lr=6.4462e-05) (hash(x)=25903778) +6324 train 6.731610 (lr=6.4439e-05) (hash(x)=25391306) +6325 train 6.714939 (lr=6.4416e-05) (hash(x)=24463061) +6326 train 6.744910 (lr=6.4394e-05) (hash(x)=25888454) +6327 train 6.726531 (lr=6.4371e-05) (hash(x)=24748118) +6328 train 6.736858 (lr=6.4348e-05) (hash(x)=26770616) +6329 train 7.193236 (lr=6.4326e-05) (hash(x)=36051125) +6330 train 6.817751 (lr=6.4303e-05) (hash(x)=30079769) +6331 train 6.731271 (lr=6.4281e-05) (hash(x)=25300507) +6332 train 6.687326 (lr=6.4258e-05) (hash(x)=25264861) +6333 train 6.949310 (lr=6.4235e-05) (hash(x)=28076910) +6334 train 6.814931 (lr=6.4213e-05) (hash(x)=23872907) +6335 train 6.983266 (lr=6.4190e-05) (hash(x)=27033802) +6336 train 7.086359 (lr=6.4168e-05) (hash(x)=29034926) +6337 train 7.031785 (lr=6.4145e-05) (hash(x)=30388751) +6338 train 6.665866 (lr=6.4122e-05) (hash(x)=22350080) +6339 train 6.688284 (lr=6.4100e-05) (hash(x)=24888803) +6340 train 7.022704 (lr=6.4077e-05) (hash(x)=27045574) +6341 train 6.472556 (lr=6.4055e-05) (hash(x)=21911287) +6342 train 6.762057 (lr=6.4032e-05) (hash(x)=24549351) +6343 train 6.797203 (lr=6.4009e-05) (hash(x)=28788047) +6344 train 6.802729 (lr=6.3987e-05) (hash(x)=29734689) +6345 train 6.648633 (lr=6.3964e-05) (hash(x)=24915549) +6346 train 6.603639 (lr=6.3942e-05) (hash(x)=23615366) +6347 train 6.697722 (lr=6.3919e-05) (hash(x)=23609078) +6348 train 6.519879 (lr=6.3897e-05) (hash(x)=21506588) +6349 train 6.725418 (lr=6.3874e-05) (hash(x)=27036363) +6350 val loss 6.7364 +6350 val perplexity 842.5118 +6350 train 6.569339 (lr=6.3851e-05) (hash(x)=24002412) +6351 train 6.470453 (lr=6.3829e-05) (hash(x)=22185099) +6352 train 7.149307 (lr=6.3806e-05) (hash(x)=34289649) +6353 train 7.318689 (lr=6.3784e-05) (hash(x)=31299333) +6354 train 7.181187 (lr=6.3761e-05) (hash(x)=32794739) +6355 train 6.629282 (lr=6.3739e-05) (hash(x)=26805248) +6356 train 6.634726 (lr=6.3716e-05) (hash(x)=23809235) +6357 train 6.708240 (lr=6.3694e-05) (hash(x)=23530260) +6358 train 7.132778 (lr=6.3671e-05) (hash(x)=27848290) +6359 train 6.329806 (lr=6.3649e-05) (hash(x)=21585136) +6360 train 6.623978 (lr=6.3626e-05) (hash(x)=26665791) +6361 train 6.865958 (lr=6.3604e-05) (hash(x)=26577204) +6362 train 6.613823 (lr=6.3581e-05) (hash(x)=25064544) +6363 train 6.347074 (lr=6.3559e-05) (hash(x)=21098074) +6364 train 6.636158 (lr=6.3536e-05) (hash(x)=24402881) +6365 train 6.730886 (lr=6.3514e-05) (hash(x)=24719109) +6366 train 6.668485 (lr=6.3491e-05) (hash(x)=23949460) +6367 train 7.065729 (lr=6.3469e-05) (hash(x)=27691968) +6368 train 6.898888 (lr=6.3446e-05) (hash(x)=22484838) +6369 train 6.754116 (lr=6.3424e-05) (hash(x)=25616543) +6370 train 6.516630 (lr=6.3401e-05) (hash(x)=19538996) +6371 train 6.779512 (lr=6.3379e-05) (hash(x)=22407092) +6372 train 6.735961 (lr=6.3356e-05) (hash(x)=26712143) +6373 train 6.688695 (lr=6.3334e-05) (hash(x)=23057931) +6374 train 6.723588 (lr=6.3311e-05) (hash(x)=25451241) +6375 train 6.525969 (lr=6.3289e-05) (hash(x)=23706103) +6376 train 6.397173 (lr=6.3266e-05) (hash(x)=21757290) +6377 train 6.414414 (lr=6.3244e-05) (hash(x)=20986476) +6378 train 6.328622 (lr=6.3221e-05) (hash(x)=20111855) +6379 train 6.583164 (lr=6.3199e-05) (hash(x)=25335816) +6380 train 6.790474 (lr=6.3176e-05) (hash(x)=27243395) +6381 train 6.545430 (lr=6.3154e-05) (hash(x)=20620920) +6382 train 6.505058 (lr=6.3131e-05) (hash(x)=23698129) +6383 train 6.779334 (lr=6.3109e-05) (hash(x)=27918030) +6384 train 7.129688 (lr=6.3087e-05) (hash(x)=26713866) +6385 train 6.788519 (lr=6.3064e-05) (hash(x)=25706727) +6386 train 6.734346 (lr=6.3042e-05) (hash(x)=24469367) +6387 train 6.716304 (lr=6.3019e-05) (hash(x)=23707924) +6388 train 7.184279 (lr=6.2997e-05) (hash(x)=30690118) +6389 train 6.599563 (lr=6.2974e-05) (hash(x)=22929819) +6390 train 6.640799 (lr=6.2952e-05) (hash(x)=24335057) +6391 train 6.579395 (lr=6.2930e-05) (hash(x)=23127886) +6392 train 6.487888 (lr=6.2907e-05) (hash(x)=20281836) +6393 train 6.811025 (lr=6.2885e-05) (hash(x)=26921653) +6394 train 6.792683 (lr=6.2862e-05) (hash(x)=26718575) +6395 train 7.219695 (lr=6.2840e-05) (hash(x)=30330131) +6396 train 6.977075 (lr=6.2818e-05) (hash(x)=28748668) +6397 train 6.875438 (lr=6.2795e-05) (hash(x)=25553105) +6398 train 6.595619 (lr=6.2773e-05) (hash(x)=23014637) +6399 train 6.752439 (lr=6.2750e-05) (hash(x)=26197070) +6400 val loss 6.7235 +6400 val perplexity 831.7137 +6400 train 6.801134 (lr=6.2728e-05) (hash(x)=26501302) +6401 train 7.177848 (lr=6.2706e-05) (hash(x)=30227184) +6402 train 6.770064 (lr=6.2683e-05) (hash(x)=26145746) +6403 train 6.840440 (lr=6.2661e-05) (hash(x)=26375139) +6404 train 6.996100 (lr=6.2638e-05) (hash(x)=29258245) +6405 train 6.765767 (lr=6.2616e-05) (hash(x)=25590383) +6406 train 6.556205 (lr=6.2594e-05) (hash(x)=23954536) +6407 train 6.880006 (lr=6.2571e-05) (hash(x)=26463005) +6408 train 6.614699 (lr=6.2549e-05) (hash(x)=25262813) +6409 train 7.037940 (lr=6.2527e-05) (hash(x)=29629632) +6410 train 6.524571 (lr=6.2504e-05) (hash(x)=24129706) +6411 train 7.316133 (lr=6.2482e-05) (hash(x)=31602829) +6412 train 6.579433 (lr=6.2460e-05) (hash(x)=23631106) +6413 train 6.654531 (lr=6.2437e-05) (hash(x)=23820121) +6414 train 6.798052 (lr=6.2415e-05) (hash(x)=25090085) +6415 train 6.408859 (lr=6.2392e-05) (hash(x)=19160134) +6416 train 6.969322 (lr=6.2370e-05) (hash(x)=27345814) +6417 train 6.915020 (lr=6.2348e-05) (hash(x)=29638766) +6418 train 6.438119 (lr=6.2325e-05) (hash(x)=20682579) +6419 train 6.710851 (lr=6.2303e-05) (hash(x)=24597655) +6420 train 6.352027 (lr=6.2281e-05) (hash(x)=19718535) +6421 train 6.736130 (lr=6.2259e-05) (hash(x)=24664066) +6422 train 6.952687 (lr=6.2236e-05) (hash(x)=26511181) +6423 train 6.569950 (lr=6.2214e-05) (hash(x)=23699136) +6424 train 6.807832 (lr=6.2192e-05) (hash(x)=27669668) +6425 train 6.595735 (lr=6.2169e-05) (hash(x)=26303417) +6426 train 6.693791 (lr=6.2147e-05) (hash(x)=25066193) +6427 train 6.807931 (lr=6.2125e-05) (hash(x)=26748789) +6428 train 6.859009 (lr=6.2102e-05) (hash(x)=24973776) +6429 train 6.660149 (lr=6.2080e-05) (hash(x)=22716410) +6430 train 6.967969 (lr=6.2058e-05) (hash(x)=25256770) +6431 train 6.725028 (lr=6.2035e-05) (hash(x)=25353051) +6432 train 7.042052 (lr=6.2013e-05) (hash(x)=28304836) +6433 train 6.670842 (lr=6.1991e-05) (hash(x)=24557361) +6434 train 6.725680 (lr=6.1969e-05) (hash(x)=24311042) +6435 train 6.760007 (lr=6.1946e-05) (hash(x)=24780312) +6436 train 6.539731 (lr=6.1924e-05) (hash(x)=23831988) +6437 train 6.761615 (lr=6.1902e-05) (hash(x)=27148011) +6438 train 6.282558 (lr=6.1880e-05) (hash(x)=19352138) +6439 train 6.767095 (lr=6.1857e-05) (hash(x)=21558484) +6440 train 6.711507 (lr=6.1835e-05) (hash(x)=22684035) +6441 train 6.656948 (lr=6.1813e-05) (hash(x)=23347051) +6442 train 6.437633 (lr=6.1791e-05) (hash(x)=22500829) +6443 train 6.486623 (lr=6.1768e-05) (hash(x)=21468281) +6444 train 6.538166 (lr=6.1746e-05) (hash(x)=24340779) +6445 train 6.746545 (lr=6.1724e-05) (hash(x)=24815837) +6446 train 6.773976 (lr=6.1702e-05) (hash(x)=27008683) +6447 train 6.695419 (lr=6.1679e-05) (hash(x)=22828380) +6448 train 6.595995 (lr=6.1657e-05) (hash(x)=23017349) +6449 train 6.858356 (lr=6.1635e-05) (hash(x)=25479526) +6450 val loss 6.7263 +6450 val perplexity 834.0355 +6450 train 6.410745 (lr=6.1613e-05) (hash(x)=17701574) +6451 train 6.352615 (lr=6.1590e-05) (hash(x)=19071259) +6452 train 6.779368 (lr=6.1568e-05) (hash(x)=26359009) +6453 train 6.982852 (lr=6.1546e-05) (hash(x)=25496699) +6454 train 7.064710 (lr=6.1524e-05) (hash(x)=25972229) +6455 train 6.631824 (lr=6.1502e-05) (hash(x)=24623811) +6456 train 6.437387 (lr=6.1479e-05) (hash(x)=23501789) +6457 train 7.336988 (lr=6.1457e-05) (hash(x)=33758715) +6458 train 6.983874 (lr=6.1435e-05) (hash(x)=32783215) +6459 train 6.844182 (lr=6.1413e-05) (hash(x)=24877432) +6460 train 6.575209 (lr=6.1391e-05) (hash(x)=22645073) +6461 train 7.053010 (lr=6.1368e-05) (hash(x)=27908161) +6462 train 7.047910 (lr=6.1346e-05) (hash(x)=29172670) +6463 train 6.710014 (lr=6.1324e-05) (hash(x)=25410299) +6464 train 6.798458 (lr=6.1302e-05) (hash(x)=23586801) +6465 train 6.659719 (lr=6.1280e-05) (hash(x)=23941914) +6466 train 6.744383 (lr=6.1258e-05) (hash(x)=20803933) +6467 train 6.737031 (lr=6.1235e-05) (hash(x)=23472652) +6468 train 6.751787 (lr=6.1213e-05) (hash(x)=27343780) +6469 train 6.689517 (lr=6.1191e-05) (hash(x)=25984122) +6470 train 6.748909 (lr=6.1169e-05) (hash(x)=25424916) +6471 train 7.052864 (lr=6.1147e-05) (hash(x)=26046091) +6472 train 7.409299 (lr=6.1125e-05) (hash(x)=31192452) +6473 train 7.101862 (lr=6.1103e-05) (hash(x)=30660596) +6474 train 6.808507 (lr=6.1080e-05) (hash(x)=26427688) +6475 train 6.735064 (lr=6.1058e-05) (hash(x)=25823748) +6476 train 6.687737 (lr=6.1036e-05) (hash(x)=23265176) +6477 train 6.530827 (lr=6.1014e-05) (hash(x)=23683470) +6478 train 7.053711 (lr=6.0992e-05) (hash(x)=25901069) +6479 train 7.180156 (lr=6.0970e-05) (hash(x)=29887482) +6480 train 6.777484 (lr=6.0948e-05) (hash(x)=24798923) +6481 train 6.730946 (lr=6.0925e-05) (hash(x)=22313381) +6482 train 6.639955 (lr=6.0903e-05) (hash(x)=21504956) +6483 train 6.473093 (lr=6.0881e-05) (hash(x)=23604733) +6484 train 6.526338 (lr=6.0859e-05) (hash(x)=24020741) +6485 train 6.519855 (lr=6.0837e-05) (hash(x)=23457146) +6486 train 6.801706 (lr=6.0815e-05) (hash(x)=24126150) +6487 train 6.542661 (lr=6.0793e-05) (hash(x)=21809706) +6488 train 6.838256 (lr=6.0771e-05) (hash(x)=26084651) +6489 train 7.155046 (lr=6.0749e-05) (hash(x)=29867000) +6490 train 6.979784 (lr=6.0727e-05) (hash(x)=29830560) +6491 train 6.859445 (lr=6.0705e-05) (hash(x)=26739602) +6492 train 6.652905 (lr=6.0682e-05) (hash(x)=25457835) +6493 train 6.556494 (lr=6.0660e-05) (hash(x)=23270777) +6494 train 6.595926 (lr=6.0638e-05) (hash(x)=24105204) +6495 train 6.533270 (lr=6.0616e-05) (hash(x)=23712872) +6496 train 6.765500 (lr=6.0594e-05) (hash(x)=26066150) +6497 train 6.713515 (lr=6.0572e-05) (hash(x)=26485865) +6498 train 6.291575 (lr=6.0550e-05) (hash(x)=22296514) +6499 train 6.612634 (lr=6.0528e-05) (hash(x)=23412256) +6500 val loss 6.7111 +6500 val perplexity 821.5079 +6500 train 6.702200 (lr=6.0506e-05) (hash(x)=25915248) +6501 train 6.872786 (lr=6.0484e-05) (hash(x)=27193330) +6502 train 6.550590 (lr=6.0462e-05) (hash(x)=24757068) +6503 train 6.606986 (lr=6.0440e-05) (hash(x)=25875103) +6504 train 6.715951 (lr=6.0418e-05) (hash(x)=24210998) +6505 train 6.662057 (lr=6.0396e-05) (hash(x)=23708477) +6506 train 6.502963 (lr=6.0374e-05) (hash(x)=21400051) +6507 train 6.776152 (lr=6.0352e-05) (hash(x)=26452480) +6508 train 6.563697 (lr=6.0330e-05) (hash(x)=25330485) +6509 train 6.277898 (lr=6.0308e-05) (hash(x)=20562478) +6510 train 6.519273 (lr=6.0286e-05) (hash(x)=22931539) +6511 train 6.684288 (lr=6.0264e-05) (hash(x)=23736441) +6512 train 6.699304 (lr=6.0242e-05) (hash(x)=24641270) +6513 train 6.441413 (lr=6.0220e-05) (hash(x)=23908899) +6514 train 6.685299 (lr=6.0198e-05) (hash(x)=23811230) +6515 train 6.650009 (lr=6.0176e-05) (hash(x)=23730269) +6516 train 6.734625 (lr=6.0154e-05) (hash(x)=25450921) +6517 train 6.998605 (lr=6.0132e-05) (hash(x)=24825774) +6518 train 6.811689 (lr=6.0110e-05) (hash(x)=26183286) +6519 train 6.595659 (lr=6.0088e-05) (hash(x)=25093883) +6520 train 6.599437 (lr=6.0066e-05) (hash(x)=25280135) +6521 train 6.633207 (lr=6.0044e-05) (hash(x)=24709218) +6522 train 6.715385 (lr=6.0022e-05) (hash(x)=25337737) +6523 train 6.749494 (lr=6.0000e-05) (hash(x)=25880656) +6524 train 6.753523 (lr=5.9978e-05) (hash(x)=24806396) +6525 train 6.540334 (lr=5.9956e-05) (hash(x)=22967282) +6526 train 6.431147 (lr=5.9934e-05) (hash(x)=23423649) +6527 train 6.737737 (lr=5.9912e-05) (hash(x)=23692325) +6528 train 6.644441 (lr=5.9890e-05) (hash(x)=24793286) +6529 train 6.361970 (lr=5.9868e-05) (hash(x)=21861732) +6530 train 6.405592 (lr=5.9846e-05) (hash(x)=20376994) +6531 train 6.418121 (lr=5.9824e-05) (hash(x)=19897671) +6532 train 6.620523 (lr=5.9802e-05) (hash(x)=23805373) +6533 train 6.552617 (lr=5.9780e-05) (hash(x)=22770802) +6534 train 6.457738 (lr=5.9758e-05) (hash(x)=20817421) +6535 train 6.645041 (lr=5.9736e-05) (hash(x)=23061082) +6536 train 6.571938 (lr=5.9715e-05) (hash(x)=23703835) +6537 train 6.603511 (lr=5.9693e-05) (hash(x)=23495551) +6538 train 6.704929 (lr=5.9671e-05) (hash(x)=26965518) +6539 train 6.590042 (lr=5.9649e-05) (hash(x)=25016605) +6540 train 6.905722 (lr=5.9627e-05) (hash(x)=28268252) +6541 train 6.625385 (lr=5.9605e-05) (hash(x)=24414422) +6542 train 6.822032 (lr=5.9583e-05) (hash(x)=26304971) +6543 train 6.751825 (lr=5.9561e-05) (hash(x)=26094253) +6544 train 6.744519 (lr=5.9539e-05) (hash(x)=27288882) +6545 train 6.494179 (lr=5.9517e-05) (hash(x)=23235796) +6546 train 6.725679 (lr=5.9496e-05) (hash(x)=25614751) +6547 train 6.815810 (lr=5.9474e-05) (hash(x)=26257920) +6548 train 7.064773 (lr=5.9452e-05) (hash(x)=27528494) +6549 train 6.555851 (lr=5.9430e-05) (hash(x)=26109537) +6550 val loss 6.7202 +6550 val perplexity 829.0150 +6550 train 7.154356 (lr=5.9408e-05) (hash(x)=29056355) +6551 train 6.976779 (lr=5.9386e-05) (hash(x)=27327886) +6552 train 6.633129 (lr=5.9364e-05) (hash(x)=25379303) +6553 train 6.613402 (lr=5.9342e-05) (hash(x)=24031809) +6554 train 6.626506 (lr=5.9321e-05) (hash(x)=24368446) +6555 train 6.597606 (lr=5.9299e-05) (hash(x)=17980284) +6556 train 6.460194 (lr=5.9277e-05) (hash(x)=17135456) +6557 train 7.005454 (lr=5.9255e-05) (hash(x)=24328670) +6558 train 6.822784 (lr=5.9233e-05) (hash(x)=26330469) +6559 train 6.811400 (lr=5.9211e-05) (hash(x)=26186143) +6560 train 6.627397 (lr=5.9190e-05) (hash(x)=21312536) +6561 train 6.655827 (lr=5.9168e-05) (hash(x)=23620433) +6562 train 6.654243 (lr=5.9146e-05) (hash(x)=23237757) +6563 train 6.735336 (lr=5.9124e-05) (hash(x)=26383776) +6564 train 6.678801 (lr=5.9102e-05) (hash(x)=23866082) +6565 train 6.628591 (lr=5.9080e-05) (hash(x)=25119724) +6566 train 6.683923 (lr=5.9059e-05) (hash(x)=22138024) +6567 train 6.843146 (lr=5.9037e-05) (hash(x)=25336043) +6568 train 6.573400 (lr=5.9015e-05) (hash(x)=22265633) +6569 train 7.117701 (lr=5.8993e-05) (hash(x)=29533717) +6570 train 6.680074 (lr=5.8971e-05) (hash(x)=24529167) +6571 train 6.704204 (lr=5.8950e-05) (hash(x)=25878996) +6572 train 6.873288 (lr=5.8928e-05) (hash(x)=25030684) +6573 train 6.615953 (lr=5.8906e-05) (hash(x)=23302539) +6574 train 6.898439 (lr=5.8884e-05) (hash(x)=26424915) +6575 train 6.582356 (lr=5.8863e-05) (hash(x)=22811468) +6576 train 6.651901 (lr=5.8841e-05) (hash(x)=25681320) +6577 train 6.613539 (lr=5.8819e-05) (hash(x)=21672176) +6578 train 6.754108 (lr=5.8797e-05) (hash(x)=25546994) +6579 train 6.629109 (lr=5.8775e-05) (hash(x)=21632628) +6580 train 6.529082 (lr=5.8754e-05) (hash(x)=23217133) +6581 train 6.760785 (lr=5.8732e-05) (hash(x)=25568414) +6582 train 7.072968 (lr=5.8710e-05) (hash(x)=26521542) +6583 train 7.058980 (lr=5.8688e-05) (hash(x)=27925831) +6584 train 6.837256 (lr=5.8667e-05) (hash(x)=25677086) +6585 train 6.873632 (lr=5.8645e-05) (hash(x)=28006499) +6586 train 6.405332 (lr=5.8623e-05) (hash(x)=24166700) +6587 train 6.783045 (lr=5.8601e-05) (hash(x)=23914950) +6588 train 6.756094 (lr=5.8580e-05) (hash(x)=24511602) +6589 train 6.768405 (lr=5.8558e-05) (hash(x)=24532165) +6590 train 6.725883 (lr=5.8536e-05) (hash(x)=25169757) +6591 train 7.243274 (lr=5.8515e-05) (hash(x)=35528108) +6592 train 7.160187 (lr=5.8493e-05) (hash(x)=33572387) +6593 train 6.346091 (lr=5.8471e-05) (hash(x)=20757754) +6594 train 6.624988 (lr=5.8449e-05) (hash(x)=27790550) +6595 train 6.662776 (lr=5.8428e-05) (hash(x)=25766841) +6596 train 6.843513 (lr=5.8406e-05) (hash(x)=25982699) +6597 train 6.625133 (lr=5.8384e-05) (hash(x)=24998585) +6598 train 7.367909 (lr=5.8363e-05) (hash(x)=28188355) +6599 train 6.708416 (lr=5.8341e-05) (hash(x)=24949421) +6600 val loss 6.7165 +6600 val perplexity 825.9354 +6600 train 6.343804 (lr=5.8319e-05) (hash(x)=23872245) +6601 train 6.860002 (lr=5.8298e-05) (hash(x)=27849873) +6602 train 6.674449 (lr=5.8276e-05) (hash(x)=23867288) +6603 train 6.467304 (lr=5.8254e-05) (hash(x)=22078476) +6604 train 6.427331 (lr=5.8233e-05) (hash(x)=23416107) +6605 train 6.467948 (lr=5.8211e-05) (hash(x)=24495589) +6606 train 6.794427 (lr=5.8189e-05) (hash(x)=26346747) +6607 train 6.437208 (lr=5.8168e-05) (hash(x)=22845735) +6608 train 6.526249 (lr=5.8146e-05) (hash(x)=22160666) +6609 train 6.675552 (lr=5.8124e-05) (hash(x)=24322392) +6610 train 6.581995 (lr=5.8103e-05) (hash(x)=24901746) +6611 train 6.259971 (lr=5.8081e-05) (hash(x)=22161685) +6612 train 6.746327 (lr=5.8059e-05) (hash(x)=24382962) +6613 train 6.762346 (lr=5.8038e-05) (hash(x)=24755182) +6614 train 6.683807 (lr=5.8016e-05) (hash(x)=25593753) +6615 train 7.057788 (lr=5.7994e-05) (hash(x)=28138281) +6616 train 6.572220 (lr=5.7973e-05) (hash(x)=22617603) +6617 train 6.535779 (lr=5.7951e-05) (hash(x)=24707707) +6618 train 6.794466 (lr=5.7930e-05) (hash(x)=25061784) +6619 train 6.592704 (lr=5.7908e-05) (hash(x)=25747726) +6620 train 7.119829 (lr=5.7886e-05) (hash(x)=27211326) +6621 train 6.698439 (lr=5.7865e-05) (hash(x)=27027610) +6622 train 6.770950 (lr=5.7843e-05) (hash(x)=25466076) +6623 train 6.808994 (lr=5.7822e-05) (hash(x)=29038360) +6624 train 6.830751 (lr=5.7800e-05) (hash(x)=29571215) +6625 train 6.521413 (lr=5.7778e-05) (hash(x)=23238597) +6626 train 6.653017 (lr=5.7757e-05) (hash(x)=25410332) +6627 train 6.763246 (lr=5.7735e-05) (hash(x)=25751789) +6628 train 6.679903 (lr=5.7714e-05) (hash(x)=25362454) +6629 train 6.743053 (lr=5.7692e-05) (hash(x)=25766851) +6630 train 6.698157 (lr=5.7670e-05) (hash(x)=24910605) +6631 train 6.771694 (lr=5.7649e-05) (hash(x)=22827903) +6632 train 6.652753 (lr=5.7627e-05) (hash(x)=25584556) +6633 train 6.489545 (lr=5.7606e-05) (hash(x)=24421917) +6634 train 6.965593 (lr=5.7584e-05) (hash(x)=26521789) +6635 train 6.884314 (lr=5.7563e-05) (hash(x)=27684827) +6636 train 6.608031 (lr=5.7541e-05) (hash(x)=24496831) +6637 train 6.895201 (lr=5.7520e-05) (hash(x)=29121769) +6638 train 6.853336 (lr=5.7498e-05) (hash(x)=26976199) +6639 train 6.895685 (lr=5.7476e-05) (hash(x)=24647015) +6640 train 6.474707 (lr=5.7455e-05) (hash(x)=23533112) +6641 train 7.090727 (lr=5.7433e-05) (hash(x)=27728407) +6642 train 6.666399 (lr=5.7412e-05) (hash(x)=23870478) +6643 train 6.779106 (lr=5.7390e-05) (hash(x)=25635037) +6644 train 6.587296 (lr=5.7369e-05) (hash(x)=22902654) +6645 train 6.744533 (lr=5.7347e-05) (hash(x)=24756433) +6646 train 6.659529 (lr=5.7326e-05) (hash(x)=21646367) +6647 train 6.352454 (lr=5.7304e-05) (hash(x)=20477804) +6648 train 6.546036 (lr=5.7283e-05) (hash(x)=23702230) +6649 train 6.836159 (lr=5.7261e-05) (hash(x)=25480910) +6650 val loss 6.7018 +6650 val perplexity 813.8919 +6650 train 6.605155 (lr=5.7240e-05) (hash(x)=23989284) +6651 train 6.548540 (lr=5.7218e-05) (hash(x)=23226570) +6652 train 6.406940 (lr=5.7197e-05) (hash(x)=19657472) +6653 train 6.496341 (lr=5.7175e-05) (hash(x)=21354883) +6654 train 6.767953 (lr=5.7154e-05) (hash(x)=24915427) +6655 train 6.847787 (lr=5.7132e-05) (hash(x)=26692640) +6656 train 6.554329 (lr=5.7111e-05) (hash(x)=25516080) +6657 train 6.554471 (lr=5.7089e-05) (hash(x)=22755928) +6658 train 6.666805 (lr=5.7068e-05) (hash(x)=23792707) +6659 train 7.166565 (lr=5.7047e-05) (hash(x)=30505094) +6660 train 6.801991 (lr=5.7025e-05) (hash(x)=24887481) +6661 train 6.274940 (lr=5.7004e-05) (hash(x)=18352418) +6662 train 6.670843 (lr=5.6982e-05) (hash(x)=23821936) +6663 train 7.091811 (lr=5.6961e-05) (hash(x)=27388794) +6664 train 7.572109 (lr=5.6939e-05) (hash(x)=32531750) +6665 train 6.804301 (lr=5.6918e-05) (hash(x)=26251471) +6666 train 6.744940 (lr=5.6896e-05) (hash(x)=25379513) +6667 train 6.980494 (lr=5.6875e-05) (hash(x)=26464796) +6668 train 6.641743 (lr=5.6854e-05) (hash(x)=25226691) +6669 train 7.248963 (lr=5.6832e-05) (hash(x)=35216057) +6670 train 7.236151 (lr=5.6811e-05) (hash(x)=34846068) +6671 train 6.596277 (lr=5.6789e-05) (hash(x)=25265875) +6672 train 6.925989 (lr=5.6768e-05) (hash(x)=29338495) +6673 train 6.714469 (lr=5.6747e-05) (hash(x)=24613853) +6674 train 6.634613 (lr=5.6725e-05) (hash(x)=23316747) +6675 train 6.648499 (lr=5.6704e-05) (hash(x)=25144290) +6676 train 6.473430 (lr=5.6682e-05) (hash(x)=20570778) +6677 train 6.732851 (lr=5.6661e-05) (hash(x)=25961546) +6678 train 6.379395 (lr=5.6640e-05) (hash(x)=21952084) +6679 train 6.651918 (lr=5.6618e-05) (hash(x)=21841888) +6680 train 6.715526 (lr=5.6597e-05) (hash(x)=26221655) +6681 train 7.321805 (lr=5.6575e-05) (hash(x)=29479990) +6682 train 6.601569 (lr=5.6554e-05) (hash(x)=24526286) +6683 train 6.772023 (lr=5.6533e-05) (hash(x)=26454000) +6684 train 6.661401 (lr=5.6511e-05) (hash(x)=23398256) +6685 train 6.492476 (lr=5.6490e-05) (hash(x)=23387126) +6686 train 6.790088 (lr=5.6469e-05) (hash(x)=24806864) +6687 train 6.533649 (lr=5.6447e-05) (hash(x)=19809196) +6688 train 7.168717 (lr=5.6426e-05) (hash(x)=27030806) +6689 train 7.795539 (lr=5.6405e-05) (hash(x)=32976656) +6690 train 6.759073 (lr=5.6383e-05) (hash(x)=28265428) +6691 train 6.512672 (lr=5.6362e-05) (hash(x)=21882489) +6692 train 6.737628 (lr=5.6341e-05) (hash(x)=23649986) +6693 train 6.637737 (lr=5.6319e-05) (hash(x)=22792760) +6694 train 6.532953 (lr=5.6298e-05) (hash(x)=23519386) +6695 train 6.536446 (lr=5.6277e-05) (hash(x)=23007945) +6696 train 7.139526 (lr=5.6255e-05) (hash(x)=29863078) +6697 train 6.750241 (lr=5.6234e-05) (hash(x)=27150582) +6698 train 6.926831 (lr=5.6213e-05) (hash(x)=29058541) +6699 train 6.361716 (lr=5.6191e-05) (hash(x)=21321491) +6700 val loss 6.7195 +6700 val perplexity 828.4084 +6700 train 6.718700 (lr=5.6170e-05) (hash(x)=25074402) +6701 train 6.782699 (lr=5.6149e-05) (hash(x)=25070101) +6702 train 6.622453 (lr=5.6127e-05) (hash(x)=26448841) +6703 train 6.780968 (lr=5.6106e-05) (hash(x)=24079409) +6704 train 6.693456 (lr=5.6085e-05) (hash(x)=27013854) +6705 train 6.697026 (lr=5.6064e-05) (hash(x)=26192970) +6706 train 6.689859 (lr=5.6042e-05) (hash(x)=23398599) +6707 train 6.710674 (lr=5.6021e-05) (hash(x)=27458572) +6708 train 6.680453 (lr=5.6000e-05) (hash(x)=23730364) +6709 train 6.784771 (lr=5.5978e-05) (hash(x)=24719147) +6710 train 6.852330 (lr=5.5957e-05) (hash(x)=26381634) +6711 train 6.770692 (lr=5.5936e-05) (hash(x)=25874533) +6712 train 6.631415 (lr=5.5915e-05) (hash(x)=23893555) +6713 train 6.545808 (lr=5.5893e-05) (hash(x)=22668921) +6714 train 6.693785 (lr=5.5872e-05) (hash(x)=25338632) +6715 train 6.689333 (lr=5.5851e-05) (hash(x)=24203734) +6716 train 6.468263 (lr=5.5830e-05) (hash(x)=21927357) +6717 train 6.618448 (lr=5.5809e-05) (hash(x)=23390948) +6718 train 6.528230 (lr=5.5787e-05) (hash(x)=22728789) +6719 train 6.618810 (lr=5.5766e-05) (hash(x)=23660106) +6720 train 6.691389 (lr=5.5745e-05) (hash(x)=23800477) +6721 train 6.805182 (lr=5.5724e-05) (hash(x)=24913248) +6722 train 6.543817 (lr=5.5702e-05) (hash(x)=24169636) +6723 train 6.813918 (lr=5.5681e-05) (hash(x)=24560828) +6724 train 6.713162 (lr=5.5660e-05) (hash(x)=24237245) +6725 train 6.510536 (lr=5.5639e-05) (hash(x)=24651947) +6726 train 7.407716 (lr=5.5618e-05) (hash(x)=29420795) +6727 train 9.144987 (lr=5.5596e-05) (hash(x)=41821329) +6728 train 7.747678 (lr=5.5575e-05) (hash(x)=32786221) +6729 train 6.783542 (lr=5.5554e-05) (hash(x)=21023418) +6730 train 6.686186 (lr=5.5533e-05) (hash(x)=23442219) +6731 train 6.542961 (lr=5.5512e-05) (hash(x)=22773275) +6732 train 6.251407 (lr=5.5491e-05) (hash(x)=17886006) +6733 train 6.556766 (lr=5.5469e-05) (hash(x)=23140594) +6734 train 6.741707 (lr=5.5448e-05) (hash(x)=24063042) +6735 train 6.674129 (lr=5.5427e-05) (hash(x)=25763899) +6736 train 6.672765 (lr=5.5406e-05) (hash(x)=25516642) +6737 train 6.409122 (lr=5.5385e-05) (hash(x)=19159140) +6738 train 6.366950 (lr=5.5364e-05) (hash(x)=18424174) +6739 train 6.412827 (lr=5.5342e-05) (hash(x)=21182890) +6740 train 6.488742 (lr=5.5321e-05) (hash(x)=21234344) +6741 train 6.564739 (lr=5.5300e-05) (hash(x)=21066030) +6742 train 6.538553 (lr=5.5279e-05) (hash(x)=22731347) +6743 train 6.776410 (lr=5.5258e-05) (hash(x)=28584111) +6744 train 6.889693 (lr=5.5237e-05) (hash(x)=27184335) +6745 train 7.061000 (lr=5.5216e-05) (hash(x)=25984822) +6746 train 6.898245 (lr=5.5195e-05) (hash(x)=25174200) +6747 train 7.172380 (lr=5.5173e-05) (hash(x)=28121891) +6748 train 6.756558 (lr=5.5152e-05) (hash(x)=23937505) +6749 train 7.142067 (lr=5.5131e-05) (hash(x)=31680444) +6750 val loss 6.7132 +6750 val perplexity 823.1642 +6750 train 7.177812 (lr=5.5110e-05) (hash(x)=31775752) +6751 train 6.901887 (lr=5.5089e-05) (hash(x)=25559887) +6752 train 6.965541 (lr=5.5068e-05) (hash(x)=26889984) +6753 train 6.839258 (lr=5.5047e-05) (hash(x)=24885474) +6754 train 6.988565 (lr=5.5026e-05) (hash(x)=27653326) +6755 train 7.008809 (lr=5.5005e-05) (hash(x)=28704301) +6756 train 6.639417 (lr=5.4984e-05) (hash(x)=23220071) +6757 train 6.639818 (lr=5.4963e-05) (hash(x)=25777437) +6758 train 6.383789 (lr=5.4941e-05) (hash(x)=23376819) +6759 train 7.029078 (lr=5.4920e-05) (hash(x)=26886377) +6760 train 6.717963 (lr=5.4899e-05) (hash(x)=26562352) +6761 train 6.787438 (lr=5.4878e-05) (hash(x)=20865187) +6762 train 6.745866 (lr=5.4857e-05) (hash(x)=26943122) +6763 train 6.266155 (lr=5.4836e-05) (hash(x)=20211916) +6764 train 6.552408 (lr=5.4815e-05) (hash(x)=24183772) +6765 train 6.910843 (lr=5.4794e-05) (hash(x)=29358238) +6766 train 7.360990 (lr=5.4773e-05) (hash(x)=29588395) +6767 train 6.684206 (lr=5.4752e-05) (hash(x)=26461895) +6768 train 6.593867 (lr=5.4731e-05) (hash(x)=23887258) +6769 train 6.687430 (lr=5.4710e-05) (hash(x)=25305290) +6770 train 6.749825 (lr=5.4689e-05) (hash(x)=26084485) +6771 train 6.830283 (lr=5.4668e-05) (hash(x)=27618136) +6772 train 6.694516 (lr=5.4647e-05) (hash(x)=24635142) +6773 train 7.037940 (lr=5.4626e-05) (hash(x)=28828628) +6774 train 7.164922 (lr=5.4605e-05) (hash(x)=24704431) +6775 train 6.589301 (lr=5.4584e-05) (hash(x)=23018827) +6776 train 6.502724 (lr=5.4563e-05) (hash(x)=22709338) +6777 train 6.674240 (lr=5.4542e-05) (hash(x)=23247351) +6778 train 6.622713 (lr=5.4521e-05) (hash(x)=25498173) +6779 train 6.548662 (lr=5.4500e-05) (hash(x)=24662809) +6780 train 6.463264 (lr=5.4479e-05) (hash(x)=22611088) +6781 train 6.648037 (lr=5.4458e-05) (hash(x)=23802669) +6782 train 6.759464 (lr=5.4437e-05) (hash(x)=24949367) +6783 train 6.568915 (lr=5.4416e-05) (hash(x)=24375035) +6784 train 6.647116 (lr=5.4395e-05) (hash(x)=24591903) +6785 train 6.382805 (lr=5.4374e-05) (hash(x)=22905287) +6786 train 6.837379 (lr=5.4353e-05) (hash(x)=27008221) +6787 train 6.834550 (lr=5.4332e-05) (hash(x)=25006551) +6788 train 6.890291 (lr=5.4311e-05) (hash(x)=28678624) +6789 train 6.871375 (lr=5.4290e-05) (hash(x)=26876607) +6790 train 6.810932 (lr=5.4269e-05) (hash(x)=25696699) +6791 train 6.730606 (lr=5.4249e-05) (hash(x)=26431670) +6792 train 6.440666 (lr=5.4228e-05) (hash(x)=22447904) +6793 train 6.815530 (lr=5.4207e-05) (hash(x)=27288095) +6794 train 6.515880 (lr=5.4186e-05) (hash(x)=22544642) +6795 train 6.819137 (lr=5.4165e-05) (hash(x)=25525366) +6796 train 6.450737 (lr=5.4144e-05) (hash(x)=23282628) +6797 train 6.254287 (lr=5.4123e-05) (hash(x)=18705467) +6798 train 6.633817 (lr=5.4102e-05) (hash(x)=25984698) +6799 train 6.883444 (lr=5.4081e-05) (hash(x)=25033511) +6800 val loss 6.6989 +6800 val perplexity 811.4927 +6800 train 6.900335 (lr=5.4060e-05) (hash(x)=23975197) +6801 train 6.717359 (lr=5.4039e-05) (hash(x)=25039815) +6802 train 6.588919 (lr=5.4019e-05) (hash(x)=23217200) +6803 train 6.878107 (lr=5.3998e-05) (hash(x)=24224002) +6804 train 6.657192 (lr=5.3977e-05) (hash(x)=25161716) +6805 train 6.687971 (lr=5.3956e-05) (hash(x)=25886169) +6806 train 6.831147 (lr=5.3935e-05) (hash(x)=27502719) +6807 train 6.640271 (lr=5.3914e-05) (hash(x)=25602577) +6808 train 6.959766 (lr=5.3893e-05) (hash(x)=27545504) +6809 train 6.518123 (lr=5.3872e-05) (hash(x)=21838175) +6810 train 6.686152 (lr=5.3852e-05) (hash(x)=25037291) +6811 train 6.429569 (lr=5.3831e-05) (hash(x)=20716276) +6812 train 6.735425 (lr=5.3810e-05) (hash(x)=27408058) +6813 train 6.372641 (lr=5.3789e-05) (hash(x)=22169391) +6814 train 6.915460 (lr=5.3768e-05) (hash(x)=27113892) +6815 train 6.609354 (lr=5.3747e-05) (hash(x)=23316582) +6816 train 6.628319 (lr=5.3727e-05) (hash(x)=23433105) +6817 train 6.681027 (lr=5.3706e-05) (hash(x)=29305666) +6818 train 7.140223 (lr=5.3685e-05) (hash(x)=35297310) +6819 train 6.591447 (lr=5.3664e-05) (hash(x)=23849620) +6820 train 7.104143 (lr=5.3643e-05) (hash(x)=27107733) +6821 train 6.786566 (lr=5.3623e-05) (hash(x)=26560546) +6822 train 6.770821 (lr=5.3602e-05) (hash(x)=25137099) +6823 train 6.590791 (lr=5.3581e-05) (hash(x)=22470095) +6824 train 6.890836 (lr=5.3560e-05) (hash(x)=26132895) +6825 train 6.578027 (lr=5.3539e-05) (hash(x)=24541250) +6826 train 6.651310 (lr=5.3519e-05) (hash(x)=23720088) +6827 train 6.532926 (lr=5.3498e-05) (hash(x)=22569035) +6828 train 6.834543 (lr=5.3477e-05) (hash(x)=27262034) +6829 train 6.617980 (lr=5.3456e-05) (hash(x)=23445307) +6830 train 6.436527 (lr=5.3435e-05) (hash(x)=24237239) +6831 train 6.775603 (lr=5.3415e-05) (hash(x)=25089202) +6832 train 6.482881 (lr=5.3394e-05) (hash(x)=23173444) +6833 train 6.848947 (lr=5.3373e-05) (hash(x)=26877686) +6834 train 6.527875 (lr=5.3352e-05) (hash(x)=23633472) +6835 train 6.671608 (lr=5.3332e-05) (hash(x)=25943303) +6836 train 6.514188 (lr=5.3311e-05) (hash(x)=21822646) +6837 train 6.310781 (lr=5.3290e-05) (hash(x)=20229886) +6838 train 6.763823 (lr=5.3269e-05) (hash(x)=29370875) +6839 train 6.722174 (lr=5.3249e-05) (hash(x)=26243247) +6840 train 6.846508 (lr=5.3228e-05) (hash(x)=25477267) +6841 train 6.938168 (lr=5.3207e-05) (hash(x)=23684111) +6842 train 6.989157 (lr=5.3187e-05) (hash(x)=24654212) +6843 train 6.766366 (lr=5.3166e-05) (hash(x)=25379406) +6844 train 7.048842 (lr=5.3145e-05) (hash(x)=23854000) +6845 train 6.600615 (lr=5.3124e-05) (hash(x)=23629812) +6846 train 6.562889 (lr=5.3104e-05) (hash(x)=26396873) +6847 train 6.300188 (lr=5.3083e-05) (hash(x)=22231144) +6848 train 6.411922 (lr=5.3062e-05) (hash(x)=21266452) +6849 train 6.472416 (lr=5.3042e-05) (hash(x)=23902576) +6850 val loss 6.7033 +6850 val perplexity 815.1149 +6850 train 6.647502 (lr=5.3021e-05) (hash(x)=24586225) +6851 train 6.393981 (lr=5.3000e-05) (hash(x)=19695756) +6852 train 6.818289 (lr=5.2980e-05) (hash(x)=23392481) +6853 train 6.675652 (lr=5.2959e-05) (hash(x)=23325741) +6854 train 6.884717 (lr=5.2938e-05) (hash(x)=26700345) +6855 train 6.874928 (lr=5.2918e-05) (hash(x)=27646564) +6856 train 6.627678 (lr=5.2897e-05) (hash(x)=24874929) +6857 train 6.751389 (lr=5.2876e-05) (hash(x)=24963136) +6858 train 6.917965 (lr=5.2856e-05) (hash(x)=26304463) +6859 train 7.031194 (lr=5.2835e-05) (hash(x)=31873056) +6860 train 6.778401 (lr=5.2814e-05) (hash(x)=29596650) +6861 train 6.745203 (lr=5.2794e-05) (hash(x)=25880203) +6862 train 6.777443 (lr=5.2773e-05) (hash(x)=24334005) +6863 train 6.634511 (lr=5.2752e-05) (hash(x)=23889875) +6864 train 6.624272 (lr=5.2732e-05) (hash(x)=24826632) +6865 train 6.832534 (lr=5.2711e-05) (hash(x)=25180150) +6866 train 6.839916 (lr=5.2691e-05) (hash(x)=24647163) +6867 train 6.779148 (lr=5.2670e-05) (hash(x)=20646304) +6868 train 6.758850 (lr=5.2649e-05) (hash(x)=20689195) +6869 train 6.901125 (lr=5.2629e-05) (hash(x)=26843667) +6870 train 6.306240 (lr=5.2608e-05) (hash(x)=20133161) +6871 train 6.599422 (lr=5.2588e-05) (hash(x)=25255240) +6872 train 6.973691 (lr=5.2567e-05) (hash(x)=27092216) +6873 train 7.592595 (lr=5.2546e-05) (hash(x)=30823096) +6874 train 7.064954 (lr=5.2526e-05) (hash(x)=28048909) +6875 train 6.738887 (lr=5.2505e-05) (hash(x)=27612424) +6876 train 6.892480 (lr=5.2485e-05) (hash(x)=29012150) +6877 train 6.427304 (lr=5.2464e-05) (hash(x)=22024252) +6878 train 6.460419 (lr=5.2444e-05) (hash(x)=22117914) +6879 train 6.517752 (lr=5.2423e-05) (hash(x)=23883299) +6880 train 6.314161 (lr=5.2402e-05) (hash(x)=21904815) +6881 train 7.349626 (lr=5.2382e-05) (hash(x)=28935436) +6882 train 7.283777 (lr=5.2361e-05) (hash(x)=26270776) +6883 train 6.773915 (lr=5.2341e-05) (hash(x)=25842452) +6884 train 6.810722 (lr=5.2320e-05) (hash(x)=25986471) +6885 train 6.831250 (lr=5.2300e-05) (hash(x)=25637938) +6886 train 6.574808 (lr=5.2279e-05) (hash(x)=26620873) +6887 train 6.156690 (lr=5.2259e-05) (hash(x)=18463841) +6888 train 6.769421 (lr=5.2238e-05) (hash(x)=25960731) +6889 train 6.715816 (lr=5.2218e-05) (hash(x)=25965113) +6890 train 6.650517 (lr=5.2197e-05) (hash(x)=26528548) +6891 train 6.638124 (lr=5.2177e-05) (hash(x)=24032346) +6892 train 6.796538 (lr=5.2156e-05) (hash(x)=23884939) +6893 train 6.863884 (lr=5.2136e-05) (hash(x)=26100560) +6894 train 6.818538 (lr=5.2115e-05) (hash(x)=26351527) +6895 train 7.312386 (lr=5.2095e-05) (hash(x)=30657762) +6896 train 6.472072 (lr=5.2074e-05) (hash(x)=21587235) +6897 train 6.856186 (lr=5.2054e-05) (hash(x)=27080799) +6898 train 6.860822 (lr=5.2033e-05) (hash(x)=24436942) +6899 train 6.619538 (lr=5.2013e-05) (hash(x)=25199653) +6900 val loss 6.7048 +6900 val perplexity 816.3382 +6900 train 6.524784 (lr=5.1992e-05) (hash(x)=20422558) +6901 train 6.635506 (lr=5.1972e-05) (hash(x)=23938764) +6902 train 6.894499 (lr=5.1951e-05) (hash(x)=25349008) +6903 train 6.648482 (lr=5.1931e-05) (hash(x)=25288079) +6904 train 6.830418 (lr=5.1910e-05) (hash(x)=25112142) +6905 train 6.554160 (lr=5.1890e-05) (hash(x)=24324699) +6906 train 6.263150 (lr=5.1870e-05) (hash(x)=20290952) +6907 train 6.743055 (lr=5.1849e-05) (hash(x)=24683122) +6908 train 6.685098 (lr=5.1829e-05) (hash(x)=24652019) +6909 train 6.533643 (lr=5.1808e-05) (hash(x)=24176673) +6910 train 7.121162 (lr=5.1788e-05) (hash(x)=28772002) +6911 train 7.422093 (lr=5.1767e-05) (hash(x)=28979310) +6912 train 7.178329 (lr=5.1747e-05) (hash(x)=26422011) +6913 train 7.249428 (lr=5.1727e-05) (hash(x)=26276588) +6914 train 6.912301 (lr=5.1706e-05) (hash(x)=22836037) +6915 train 7.305973 (lr=5.1686e-05) (hash(x)=27746311) +6916 train 6.742742 (lr=5.1665e-05) (hash(x)=25230879) +6917 train 6.609577 (lr=5.1645e-05) (hash(x)=22646933) +6918 train 6.754329 (lr=5.1625e-05) (hash(x)=26522270) +6919 train 7.258733 (lr=5.1604e-05) (hash(x)=30254991) +6920 train 7.002207 (lr=5.1584e-05) (hash(x)=28662220) +6921 train 6.564778 (lr=5.1563e-05) (hash(x)=24215682) +6922 train 6.926308 (lr=5.1543e-05) (hash(x)=25866847) +6923 train 6.709377 (lr=5.1523e-05) (hash(x)=25961003) +6924 train 6.829312 (lr=5.1502e-05) (hash(x)=27074446) +6925 train 6.824494 (lr=5.1482e-05) (hash(x)=26898825) +6926 train 6.682111 (lr=5.1462e-05) (hash(x)=24331627) +6927 train 6.822234 (lr=5.1441e-05) (hash(x)=27274653) +6928 train 6.963281 (lr=5.1421e-05) (hash(x)=28159546) +6929 train 6.779401 (lr=5.1401e-05) (hash(x)=25124915) +6930 train 6.804506 (lr=5.1380e-05) (hash(x)=25251610) +6931 train 6.562407 (lr=5.1360e-05) (hash(x)=22056827) +6932 train 6.972389 (lr=5.1340e-05) (hash(x)=26923073) +6933 train 6.725480 (lr=5.1319e-05) (hash(x)=25862799) +6934 train 6.620528 (lr=5.1299e-05) (hash(x)=24301773) +6935 train 6.518983 (lr=5.1279e-05) (hash(x)=23026066) +6936 train 6.575964 (lr=5.1258e-05) (hash(x)=23105685) +6937 train 6.644212 (lr=5.1238e-05) (hash(x)=27478448) +6938 train 6.835136 (lr=5.1218e-05) (hash(x)=26169471) +6939 train 6.540747 (lr=5.1197e-05) (hash(x)=22601747) +6940 train 7.291917 (lr=5.1177e-05) (hash(x)=30296475) +6941 train 7.231452 (lr=5.1157e-05) (hash(x)=29691656) +6942 train 6.547454 (lr=5.1137e-05) (hash(x)=22720381) +6943 train 5.889240 (lr=5.1116e-05) (hash(x)=14001963) +6944 train 5.856005 (lr=5.1096e-05) (hash(x)=14631858) +6945 train 6.476036 (lr=5.1076e-05) (hash(x)=22423819) +6946 train 7.210862 (lr=5.1056e-05) (hash(x)=29723263) +6947 train 6.688653 (lr=5.1035e-05) (hash(x)=24657381) +6948 train 6.741883 (lr=5.1015e-05) (hash(x)=25336099) +6949 train 6.570352 (lr=5.0995e-05) (hash(x)=23487914) +6950 val loss 6.7039 +6950 val perplexity 815.5842 +6950 train 6.639184 (lr=5.0975e-05) (hash(x)=26765380) +6951 train 6.392848 (lr=5.0954e-05) (hash(x)=21988054) +6952 train 6.611769 (lr=5.0934e-05) (hash(x)=26126422) +6953 train 6.511120 (lr=5.0914e-05) (hash(x)=23482066) +6954 train 6.538132 (lr=5.0894e-05) (hash(x)=19115084) +6955 train 6.725525 (lr=5.0873e-05) (hash(x)=23512676) +6956 train 6.873155 (lr=5.0853e-05) (hash(x)=24987854) +6957 train 6.755629 (lr=5.0833e-05) (hash(x)=27653921) +6958 train 6.646404 (lr=5.0813e-05) (hash(x)=24047191) +6959 train 7.029692 (lr=5.0792e-05) (hash(x)=26241099) +6960 train 6.531509 (lr=5.0772e-05) (hash(x)=23964904) +6961 train 7.304256 (lr=5.0752e-05) (hash(x)=27170183) +6962 train 6.635365 (lr=5.0732e-05) (hash(x)=20395110) +6963 train 7.075122 (lr=5.0712e-05) (hash(x)=28067098) +6964 train 6.550528 (lr=5.0692e-05) (hash(x)=23241130) +6965 train 6.822337 (lr=5.0671e-05) (hash(x)=28216519) +6966 train 6.437531 (lr=5.0651e-05) (hash(x)=23683700) +6967 train 6.928999 (lr=5.0631e-05) (hash(x)=26209722) +6968 train 6.755993 (lr=5.0611e-05) (hash(x)=27291568) +6969 train 6.668547 (lr=5.0591e-05) (hash(x)=26135814) +6970 train 6.823261 (lr=5.0571e-05) (hash(x)=29967783) +6971 train 6.270232 (lr=5.0550e-05) (hash(x)=20837675) +6972 train 6.338666 (lr=5.0530e-05) (hash(x)=20072848) +6973 train 6.541911 (lr=5.0510e-05) (hash(x)=23102053) +6974 train 6.799170 (lr=5.0490e-05) (hash(x)=25562339) +6975 train 7.019951 (lr=5.0470e-05) (hash(x)=26928312) +6976 train 6.829404 (lr=5.0450e-05) (hash(x)=27591338) +6977 train 6.376156 (lr=5.0430e-05) (hash(x)=21672241) +6978 train 6.413855 (lr=5.0409e-05) (hash(x)=20512732) +6979 train 6.681511 (lr=5.0389e-05) (hash(x)=23532064) +6980 train 6.947017 (lr=5.0369e-05) (hash(x)=26114608) +6981 train 6.850330 (lr=5.0349e-05) (hash(x)=27181359) +6982 train 7.114423 (lr=5.0329e-05) (hash(x)=25845731) +6983 train 6.624601 (lr=5.0309e-05) (hash(x)=23563272) +6984 train 6.886247 (lr=5.0289e-05) (hash(x)=25759110) +6985 train 6.485725 (lr=5.0269e-05) (hash(x)=20402698) +6986 train 6.808442 (lr=5.0249e-05) (hash(x)=26026033) +6987 train 6.472820 (lr=5.0229e-05) (hash(x)=22303154) +6988 train 6.759393 (lr=5.0208e-05) (hash(x)=26657540) +6989 train 6.616892 (lr=5.0188e-05) (hash(x)=23648561) +6990 train 6.731893 (lr=5.0168e-05) (hash(x)=27827459) +6991 train 6.584856 (lr=5.0148e-05) (hash(x)=25704828) +6992 train 6.686243 (lr=5.0128e-05) (hash(x)=25111251) +6993 train 6.736330 (lr=5.0108e-05) (hash(x)=24651266) +6994 train 7.361019 (lr=5.0088e-05) (hash(x)=24346899) +6995 train 7.437059 (lr=5.0068e-05) (hash(x)=29405359) +6996 train 6.684090 (lr=5.0048e-05) (hash(x)=24811175) +6997 train 7.127706 (lr=5.0028e-05) (hash(x)=32499194) +6998 train 6.640239 (lr=5.0008e-05) (hash(x)=26948069) +6999 train 6.590231 (lr=4.9988e-05) (hash(x)=22498992) +7000 val loss 6.6987 +7000 val perplexity 811.3179 +7000 train 6.590199 (lr=4.9968e-05) (hash(x)=21834790) +7001 train 6.906529 (lr=4.9948e-05) (hash(x)=29382425) +7002 train 7.665344 (lr=4.9928e-05) (hash(x)=34167369) +7003 train 8.130107 (lr=4.9908e-05) (hash(x)=38527461) +7004 train 7.793442 (lr=4.9888e-05) (hash(x)=34036906) +7005 train 6.811199 (lr=4.9868e-05) (hash(x)=25238253) +7006 train 6.783044 (lr=4.9848e-05) (hash(x)=25713486) +7007 train 6.608097 (lr=4.9828e-05) (hash(x)=22895918) +7008 train 6.527632 (lr=4.9808e-05) (hash(x)=21769925) +7009 train 6.589226 (lr=4.9788e-05) (hash(x)=24505897) +7010 train 6.676883 (lr=4.9768e-05) (hash(x)=21379653) +7011 train 6.760405 (lr=4.9748e-05) (hash(x)=21037854) +7012 train 6.699048 (lr=4.9728e-05) (hash(x)=22186080) +7013 train 6.738660 (lr=4.9708e-05) (hash(x)=24364717) +7014 train 6.539514 (lr=4.9688e-05) (hash(x)=23784975) +7015 train 6.672319 (lr=4.9668e-05) (hash(x)=24404283) +7016 train 6.458867 (lr=4.9648e-05) (hash(x)=22785890) +7017 train 6.746530 (lr=4.9628e-05) (hash(x)=24512699) +7018 train 6.438191 (lr=4.9608e-05) (hash(x)=23298437) +7019 train 6.794530 (lr=4.9588e-05) (hash(x)=26403949) +7020 train 7.039366 (lr=4.9568e-05) (hash(x)=25626033) +7021 train 6.525324 (lr=4.9549e-05) (hash(x)=22694338) +7022 train 6.577487 (lr=4.9529e-05) (hash(x)=25655764) +7023 train 6.575733 (lr=4.9509e-05) (hash(x)=26663932) +7024 train 6.799820 (lr=4.9489e-05) (hash(x)=28071590) +7025 train 6.624252 (lr=4.9469e-05) (hash(x)=26372406) +7026 train 6.991801 (lr=4.9449e-05) (hash(x)=26421078) +7027 train 6.966972 (lr=4.9429e-05) (hash(x)=27229413) +7028 train 7.134614 (lr=4.9409e-05) (hash(x)=30304544) +7029 train 6.695889 (lr=4.9389e-05) (hash(x)=22401373) +7030 train 6.506272 (lr=4.9369e-05) (hash(x)=21010759) +7031 train 6.410844 (lr=4.9350e-05) (hash(x)=22805316) +7032 train 6.840135 (lr=4.9330e-05) (hash(x)=26172538) +7033 train 6.816179 (lr=4.9310e-05) (hash(x)=26383120) +7034 train 6.846784 (lr=4.9290e-05) (hash(x)=26289689) +7035 train 6.778790 (lr=4.9270e-05) (hash(x)=25330877) +7036 train 6.887783 (lr=4.9250e-05) (hash(x)=23273963) +7037 train 6.688503 (lr=4.9230e-05) (hash(x)=23075615) +7038 train 6.732616 (lr=4.9211e-05) (hash(x)=26033873) +7039 train 6.689270 (lr=4.9191e-05) (hash(x)=23344466) +7040 train 6.626483 (lr=4.9171e-05) (hash(x)=24490307) +7041 train 6.922247 (lr=4.9151e-05) (hash(x)=27308918) +7042 train 7.051494 (lr=4.9131e-05) (hash(x)=29906407) +7043 train 6.802355 (lr=4.9111e-05) (hash(x)=25732529) +7044 train 6.370182 (lr=4.9092e-05) (hash(x)=22678195) +7045 train 6.492812 (lr=4.9072e-05) (hash(x)=22541257) +7046 train 6.773599 (lr=4.9052e-05) (hash(x)=23871340) +7047 train 6.422566 (lr=4.9032e-05) (hash(x)=20966940) +7048 train 6.373817 (lr=4.9012e-05) (hash(x)=20610743) +7049 train 6.634306 (lr=4.8993e-05) (hash(x)=23927091) +7050 val loss 6.6902 +7050 val perplexity 804.4661 +7050 train 6.740383 (lr=4.8973e-05) (hash(x)=26491802) +7051 train 6.803163 (lr=4.8953e-05) (hash(x)=26665336) +7052 train 6.575222 (lr=4.8933e-05) (hash(x)=21668690) +7053 train 6.428668 (lr=4.8913e-05) (hash(x)=24356512) +7054 train 6.998041 (lr=4.8894e-05) (hash(x)=28687744) +7055 train 6.935844 (lr=4.8874e-05) (hash(x)=27422664) +7056 train 7.112676 (lr=4.8854e-05) (hash(x)=32781667) +7057 train 6.457229 (lr=4.8834e-05) (hash(x)=21462165) +7058 train 6.656914 (lr=4.8815e-05) (hash(x)=23858829) +7059 train 7.162908 (lr=4.8795e-05) (hash(x)=28555665) +7060 train 6.668069 (lr=4.8775e-05) (hash(x)=24375099) +7061 train 6.792062 (lr=4.8755e-05) (hash(x)=25476891) +7062 train 6.501115 (lr=4.8736e-05) (hash(x)=23491684) +7063 train 6.553356 (lr=4.8716e-05) (hash(x)=22116510) +7064 train 6.603742 (lr=4.8696e-05) (hash(x)=23612320) +7065 train 6.311260 (lr=4.8676e-05) (hash(x)=23586588) +7066 train 6.360023 (lr=4.8657e-05) (hash(x)=21516423) +7067 train 6.817801 (lr=4.8637e-05) (hash(x)=27863790) +7068 train 6.749361 (lr=4.8617e-05) (hash(x)=27743326) +7069 train 6.807074 (lr=4.8598e-05) (hash(x)=24547211) +7070 train 6.525232 (lr=4.8578e-05) (hash(x)=24037768) +7071 train 6.812812 (lr=4.8558e-05) (hash(x)=27269633) +7072 train 6.306626 (lr=4.8539e-05) (hash(x)=21792088) +7073 train 6.625601 (lr=4.8519e-05) (hash(x)=21341882) +7074 train 6.630420 (lr=4.8499e-05) (hash(x)=21845392) +7075 train 6.690990 (lr=4.8480e-05) (hash(x)=26916967) +7076 train 6.425282 (lr=4.8460e-05) (hash(x)=22735536) +7077 train 6.653797 (lr=4.8440e-05) (hash(x)=24203252) +7078 train 7.106064 (lr=4.8421e-05) (hash(x)=27669513) +7079 train 7.115207 (lr=4.8401e-05) (hash(x)=27157711) +7080 train 6.797960 (lr=4.8381e-05) (hash(x)=25287525) +7081 train 6.811700 (lr=4.8362e-05) (hash(x)=21940125) +7082 train 6.920998 (lr=4.8342e-05) (hash(x)=24826499) +7083 train 6.718906 (lr=4.8322e-05) (hash(x)=25865703) +7084 train 6.852278 (lr=4.8303e-05) (hash(x)=23279891) +7085 train 6.802608 (lr=4.8283e-05) (hash(x)=23580162) +7086 train 7.065876 (lr=4.8263e-05) (hash(x)=29032576) +7087 train 6.538510 (lr=4.8244e-05) (hash(x)=22774645) +7088 train 6.554945 (lr=4.8224e-05) (hash(x)=24708057) +7089 train 6.509502 (lr=4.8205e-05) (hash(x)=24919123) +7090 train 6.501338 (lr=4.8185e-05) (hash(x)=25443928) +7091 train 6.686148 (lr=4.8165e-05) (hash(x)=26162270) +7092 train 6.767890 (lr=4.8146e-05) (hash(x)=24923015) +7093 train 6.903273 (lr=4.8126e-05) (hash(x)=27294843) +7094 train 6.727230 (lr=4.8107e-05) (hash(x)=25423338) +7095 train 6.494987 (lr=4.8087e-05) (hash(x)=22143146) +7096 train 6.714003 (lr=4.8067e-05) (hash(x)=27059592) +7097 train 6.895794 (lr=4.8048e-05) (hash(x)=31418679) +7098 train 6.778404 (lr=4.8028e-05) (hash(x)=26496553) +7099 train 6.493590 (lr=4.8009e-05) (hash(x)=22202257) +7100 val loss 6.6901 +7100 val perplexity 804.4266 +7100 train 6.586926 (lr=4.7989e-05) (hash(x)=23142580) +7101 train 6.530775 (lr=4.7970e-05) (hash(x)=22120172) +7102 train 6.461856 (lr=4.7950e-05) (hash(x)=21171528) +7103 train 6.636633 (lr=4.7931e-05) (hash(x)=22356438) +7104 train 6.013152 (lr=4.7911e-05) (hash(x)=16374966) +7105 train 5.875303 (lr=4.7892e-05) (hash(x)=14734614) +7106 train 6.174273 (lr=4.7872e-05) (hash(x)=18705676) +7107 train 6.522479 (lr=4.7852e-05) (hash(x)=22331898) +7108 train 6.686692 (lr=4.7833e-05) (hash(x)=26426927) +7109 train 6.854282 (lr=4.7813e-05) (hash(x)=28322513) +7110 train 6.399553 (lr=4.7794e-05) (hash(x)=21793586) +7111 train 6.408123 (lr=4.7774e-05) (hash(x)=23172158) +7112 train 6.574103 (lr=4.7755e-05) (hash(x)=24194310) +7113 train 6.746316 (lr=4.7735e-05) (hash(x)=24943602) +7114 train 6.452289 (lr=4.7716e-05) (hash(x)=21472431) +7115 train 6.456310 (lr=4.7696e-05) (hash(x)=22578434) +7116 train 6.679022 (lr=4.7677e-05) (hash(x)=26228533) +7117 train 6.495018 (lr=4.7658e-05) (hash(x)=22875229) +7118 train 6.927637 (lr=4.7638e-05) (hash(x)=26288856) +7119 train 7.182082 (lr=4.7619e-05) (hash(x)=26971690) +7120 train 7.132239 (lr=4.7599e-05) (hash(x)=28477427) +7121 train 6.398011 (lr=4.7580e-05) (hash(x)=22252174) +7122 train 6.502181 (lr=4.7560e-05) (hash(x)=23402405) +7123 train 6.781998 (lr=4.7541e-05) (hash(x)=26760739) +7124 train 6.885805 (lr=4.7521e-05) (hash(x)=26389945) +7125 train 6.726699 (lr=4.7502e-05) (hash(x)=27214389) +7126 train 6.688694 (lr=4.7483e-05) (hash(x)=25338580) +7127 train 6.666201 (lr=4.7463e-05) (hash(x)=24851922) +7128 train 6.409030 (lr=4.7444e-05) (hash(x)=22136298) +7129 train 6.622428 (lr=4.7424e-05) (hash(x)=23221125) +7130 train 6.548748 (lr=4.7405e-05) (hash(x)=23760685) +7131 train 6.532955 (lr=4.7385e-05) (hash(x)=22854700) +7132 train 6.696274 (lr=4.7366e-05) (hash(x)=24903121) +7133 train 6.815952 (lr=4.7347e-05) (hash(x)=24132529) +7134 train 6.534497 (lr=4.7327e-05) (hash(x)=21247750) +7135 train 6.435617 (lr=4.7308e-05) (hash(x)=21017641) +7136 train 6.511568 (lr=4.7288e-05) (hash(x)=19076810) +7137 train 6.749046 (lr=4.7269e-05) (hash(x)=24379310) +7138 train 6.966363 (lr=4.7250e-05) (hash(x)=28603106) +7139 train 6.618524 (lr=4.7230e-05) (hash(x)=24141269) +7140 train 6.548526 (lr=4.7211e-05) (hash(x)=21764101) +7141 train 6.741230 (lr=4.7192e-05) (hash(x)=21775022) +7142 train 6.645745 (lr=4.7172e-05) (hash(x)=21895421) +7143 train 6.730641 (lr=4.7153e-05) (hash(x)=28186957) +7144 train 6.521155 (lr=4.7134e-05) (hash(x)=22812610) +7145 train 6.445381 (lr=4.7114e-05) (hash(x)=24119427) +7146 train 6.523513 (lr=4.7095e-05) (hash(x)=23282795) +7147 train 6.999715 (lr=4.7076e-05) (hash(x)=27125863) +7148 train 6.869883 (lr=4.7056e-05) (hash(x)=26419805) +7149 train 6.899921 (lr=4.7037e-05) (hash(x)=27166001) +7150 val loss 6.6869 +7150 val perplexity 801.8585 +7150 train 7.003401 (lr=4.7018e-05) (hash(x)=27928188) +7151 train 6.551525 (lr=4.6998e-05) (hash(x)=25661082) +7152 train 6.255527 (lr=4.6979e-05) (hash(x)=21558964) +7153 train 6.601094 (lr=4.6960e-05) (hash(x)=23850014) +7154 train 6.714125 (lr=4.6940e-05) (hash(x)=26825924) +7155 train 6.746782 (lr=4.6921e-05) (hash(x)=27131591) +7156 train 6.742712 (lr=4.6902e-05) (hash(x)=26444054) +7157 train 6.575235 (lr=4.6883e-05) (hash(x)=25248284) +7158 train 6.536975 (lr=4.6863e-05) (hash(x)=24554954) +7159 train 6.587534 (lr=4.6844e-05) (hash(x)=25462781) +7160 train 6.564920 (lr=4.6825e-05) (hash(x)=22222060) +7161 train 6.598998 (lr=4.6806e-05) (hash(x)=25383701) +7162 train 6.373229 (lr=4.6786e-05) (hash(x)=23441254) +7163 train 6.179818 (lr=4.6767e-05) (hash(x)=19079257) +7164 train 6.523782 (lr=4.6748e-05) (hash(x)=24291754) +7165 train 6.761312 (lr=4.6729e-05) (hash(x)=28124151) +7166 train 6.751331 (lr=4.6709e-05) (hash(x)=28418942) +7167 train 6.544672 (lr=4.6690e-05) (hash(x)=21774374) +7168 train 6.844510 (lr=4.6671e-05) (hash(x)=27779305) +7169 train 6.400855 (lr=4.6652e-05) (hash(x)=22951481) +7170 train 6.467229 (lr=4.6632e-05) (hash(x)=22806793) +7171 train 6.582089 (lr=4.6613e-05) (hash(x)=21349365) +7172 train 6.509540 (lr=4.6594e-05) (hash(x)=22227088) +7173 train 6.696206 (lr=4.6575e-05) (hash(x)=23062153) +7174 train 6.564076 (lr=4.6556e-05) (hash(x)=24661912) +7175 train 6.493379 (lr=4.6536e-05) (hash(x)=23657055) +7176 train 6.405988 (lr=4.6517e-05) (hash(x)=21770827) +7177 train 6.418524 (lr=4.6498e-05) (hash(x)=19893340) +7178 train 6.292589 (lr=4.6479e-05) (hash(x)=19619883) +7179 train 6.732776 (lr=4.6460e-05) (hash(x)=27273804) +7180 train 6.865142 (lr=4.6441e-05) (hash(x)=26856233) +7181 train 7.365268 (lr=4.6421e-05) (hash(x)=30812065) +7182 train 6.646030 (lr=4.6402e-05) (hash(x)=24842855) +7183 train 6.315258 (lr=4.6383e-05) (hash(x)=23604050) +7184 train 6.740009 (lr=4.6364e-05) (hash(x)=25956781) +7185 train 6.449626 (lr=4.6345e-05) (hash(x)=22622368) +7186 train 6.611237 (lr=4.6326e-05) (hash(x)=22555062) +7187 train 7.251422 (lr=4.6306e-05) (hash(x)=28419053) +7188 train 6.799333 (lr=4.6287e-05) (hash(x)=27237746) +7189 train 7.223021 (lr=4.6268e-05) (hash(x)=34147079) +7190 train 7.477424 (lr=4.6249e-05) (hash(x)=31385476) +7191 train 7.540168 (lr=4.6230e-05) (hash(x)=31534071) +7192 train 7.116565 (lr=4.6211e-05) (hash(x)=27723214) +7193 train 6.586855 (lr=4.6192e-05) (hash(x)=25309945) +7194 train 6.802277 (lr=4.6173e-05) (hash(x)=26393634) +7195 train 6.490454 (lr=4.6154e-05) (hash(x)=22037495) +7196 train 7.271095 (lr=4.6135e-05) (hash(x)=28916808) +7197 train 6.562295 (lr=4.6115e-05) (hash(x)=24786809) +7198 train 6.714882 (lr=4.6096e-05) (hash(x)=25710773) +7199 train 6.835010 (lr=4.6077e-05) (hash(x)=24183732) +7200 val loss 6.6930 +7200 val perplexity 806.7656 +7200 train 6.494992 (lr=4.6058e-05) (hash(x)=22316783) +7201 train 6.879405 (lr=4.6039e-05) (hash(x)=26678478) +7202 train 6.594345 (lr=4.6020e-05) (hash(x)=26199861) +7203 train 6.671088 (lr=4.6001e-05) (hash(x)=23379513) +7204 train 6.854254 (lr=4.5982e-05) (hash(x)=27514862) +7205 train 6.346297 (lr=4.5963e-05) (hash(x)=22367536) +7206 train 6.982100 (lr=4.5944e-05) (hash(x)=30561348) +7207 train 6.591284 (lr=4.5925e-05) (hash(x)=23384280) +7208 train 6.314372 (lr=4.5906e-05) (hash(x)=23493944) +7209 train 6.538498 (lr=4.5887e-05) (hash(x)=23259350) +7210 train 6.555013 (lr=4.5868e-05) (hash(x)=22358072) +7211 train 6.508362 (lr=4.5849e-05) (hash(x)=21744922) +7212 train 6.577289 (lr=4.5830e-05) (hash(x)=24271785) +7213 train 6.825837 (lr=4.5811e-05) (hash(x)=26149204) +7214 train 6.602364 (lr=4.5792e-05) (hash(x)=22521682) +7215 train 6.403345 (lr=4.5773e-05) (hash(x)=21975928) +7216 train 6.520415 (lr=4.5754e-05) (hash(x)=23678091) +7217 train 6.498315 (lr=4.5735e-05) (hash(x)=24076970) +7218 train 6.490055 (lr=4.5716e-05) (hash(x)=24675328) +7219 train 6.423672 (lr=4.5697e-05) (hash(x)=24851195) +7220 train 6.446483 (lr=4.5678e-05) (hash(x)=22760843) +7221 train 6.699359 (lr=4.5659e-05) (hash(x)=26106166) +7222 train 6.543656 (lr=4.5640e-05) (hash(x)=25222927) +7223 train 6.599770 (lr=4.5621e-05) (hash(x)=25281674) +7224 train 6.438635 (lr=4.5602e-05) (hash(x)=22361636) +7225 train 6.640338 (lr=4.5583e-05) (hash(x)=19597014) +7226 train 6.547261 (lr=4.5564e-05) (hash(x)=25474355) +7227 train 6.460382 (lr=4.5545e-05) (hash(x)=25118947) +7228 train 6.551521 (lr=4.5526e-05) (hash(x)=25831087) +7229 train 6.477960 (lr=4.5507e-05) (hash(x)=21854141) +7230 train 6.521675 (lr=4.5488e-05) (hash(x)=24268266) +7231 train 6.472688 (lr=4.5470e-05) (hash(x)=22947712) +7232 train 6.337673 (lr=4.5451e-05) (hash(x)=24052718) +7233 train 6.525099 (lr=4.5432e-05) (hash(x)=23176418) +7234 train 6.608743 (lr=4.5413e-05) (hash(x)=25482113) +7235 train 6.809640 (lr=4.5394e-05) (hash(x)=27044644) +7236 train 6.542436 (lr=4.5375e-05) (hash(x)=22440648) +7237 train 6.805176 (lr=4.5356e-05) (hash(x)=24390864) +7238 train 6.480918 (lr=4.5337e-05) (hash(x)=22823292) +7239 train 6.621150 (lr=4.5318e-05) (hash(x)=24853977) +7240 train 7.008794 (lr=4.5300e-05) (hash(x)=27345173) +7241 train 6.698280 (lr=4.5281e-05) (hash(x)=25629731) +7242 train 6.845371 (lr=4.5262e-05) (hash(x)=28076236) +7243 train 6.446841 (lr=4.5243e-05) (hash(x)=23245430) +7244 train 6.817379 (lr=4.5224e-05) (hash(x)=26968550) +7245 train 6.364647 (lr=4.5205e-05) (hash(x)=22511067) +7246 train 6.615907 (lr=4.5186e-05) (hash(x)=25621873) +7247 train 6.448262 (lr=4.5168e-05) (hash(x)=23696470) +7248 train 6.729478 (lr=4.5149e-05) (hash(x)=24100851) +7249 train 6.648424 (lr=4.5130e-05) (hash(x)=26413767) +7250 val loss 6.6858 +7250 val perplexity 800.9321 +7250 train 7.003232 (lr=4.5111e-05) (hash(x)=28139390) +7251 train 6.846901 (lr=4.5092e-05) (hash(x)=28348662) +7252 train 6.238605 (lr=4.5074e-05) (hash(x)=21008922) +7253 train 6.656906 (lr=4.5055e-05) (hash(x)=23805449) +7254 train 6.602112 (lr=4.5036e-05) (hash(x)=22413998) +7255 train 6.739563 (lr=4.5017e-05) (hash(x)=27489711) +7256 train 6.546302 (lr=4.4998e-05) (hash(x)=24065426) +7257 train 6.472333 (lr=4.4980e-05) (hash(x)=23658876) +7258 train 6.714611 (lr=4.4961e-05) (hash(x)=22926681) +7259 train 6.616934 (lr=4.4942e-05) (hash(x)=25608370) +7260 train 6.623937 (lr=4.4923e-05) (hash(x)=25771904) +7261 train 6.519287 (lr=4.4904e-05) (hash(x)=23442938) +7262 train 6.295934 (lr=4.4886e-05) (hash(x)=21971477) +7263 train 6.932230 (lr=4.4867e-05) (hash(x)=28050163) +7264 train 6.233330 (lr=4.4848e-05) (hash(x)=19165144) +7265 train 6.368499 (lr=4.4829e-05) (hash(x)=23626089) +7266 train 6.489301 (lr=4.4811e-05) (hash(x)=21317430) +7267 train 6.362234 (lr=4.4792e-05) (hash(x)=22615841) +7268 train 6.560036 (lr=4.4773e-05) (hash(x)=23531191) +7269 train 6.475199 (lr=4.4755e-05) (hash(x)=22880424) +7270 train 6.499666 (lr=4.4736e-05) (hash(x)=23082105) +7271 train 6.571361 (lr=4.4717e-05) (hash(x)=26996807) +7272 train 6.406382 (lr=4.4698e-05) (hash(x)=23958387) +7273 train 7.058540 (lr=4.4680e-05) (hash(x)=29795232) +7274 train 7.388640 (lr=4.4661e-05) (hash(x)=32699751) +7275 train 7.045696 (lr=4.4642e-05) (hash(x)=28780071) +7276 train 6.793634 (lr=4.4624e-05) (hash(x)=26315947) +7277 train 6.501097 (lr=4.4605e-05) (hash(x)=25917382) +7278 train 6.583067 (lr=4.4586e-05) (hash(x)=24016901) +7279 train 6.977289 (lr=4.4568e-05) (hash(x)=28626495) +7280 train 6.888819 (lr=4.4549e-05) (hash(x)=23151801) +7281 train 6.786190 (lr=4.4530e-05) (hash(x)=26063175) +7282 train 6.557578 (lr=4.4512e-05) (hash(x)=23920603) +7283 train 6.252908 (lr=4.4493e-05) (hash(x)=18380174) +7284 train 6.451385 (lr=4.4474e-05) (hash(x)=17624934) +7285 train 6.751689 (lr=4.4456e-05) (hash(x)=23983451) +7286 train 6.434766 (lr=4.4437e-05) (hash(x)=24800016) +7287 train 6.637134 (lr=4.4418e-05) (hash(x)=24783242) +7288 train 6.349041 (lr=4.4400e-05) (hash(x)=22587569) +7289 train 6.559931 (lr=4.4381e-05) (hash(x)=26036718) +7290 train 6.264823 (lr=4.4363e-05) (hash(x)=18877382) +7291 train 6.280380 (lr=4.4344e-05) (hash(x)=19411545) +7292 train 7.114231 (lr=4.4325e-05) (hash(x)=29609344) +7293 train 6.828748 (lr=4.4307e-05) (hash(x)=27166200) +7294 train 6.604184 (lr=4.4288e-05) (hash(x)=21983275) +7295 train 6.668965 (lr=4.4270e-05) (hash(x)=25832479) +7296 train 6.376112 (lr=4.4251e-05) (hash(x)=22228927) +7297 train 6.556897 (lr=4.4232e-05) (hash(x)=24798180) +7298 train 6.446733 (lr=4.4214e-05) (hash(x)=23430458) +7299 train 6.529263 (lr=4.4195e-05) (hash(x)=25202518) +7300 val loss 6.6867 +7300 val perplexity 801.6356 +7300 train 6.273222 (lr=4.4177e-05) (hash(x)=22541251) +7301 train 6.221218 (lr=4.4158e-05) (hash(x)=21318466) +7302 train 6.374269 (lr=4.4140e-05) (hash(x)=21980528) +7303 train 6.624094 (lr=4.4121e-05) (hash(x)=23522137) +7304 train 6.534393 (lr=4.4102e-05) (hash(x)=24277176) +7305 train 6.647470 (lr=4.4084e-05) (hash(x)=26825118) +7306 train 7.009079 (lr=4.4065e-05) (hash(x)=27305832) +7307 train 7.292209 (lr=4.4047e-05) (hash(x)=28917794) +7308 train 7.217925 (lr=4.4028e-05) (hash(x)=28522343) +7309 train 6.655178 (lr=4.4010e-05) (hash(x)=23550494) +7310 train 6.689311 (lr=4.3991e-05) (hash(x)=26849849) +7311 train 6.649668 (lr=4.3973e-05) (hash(x)=26731973) +7312 train 6.654425 (lr=4.3954e-05) (hash(x)=25834330) +7313 train 6.748093 (lr=4.3936e-05) (hash(x)=25609302) +7314 train 6.709039 (lr=4.3917e-05) (hash(x)=24824675) +7315 train 7.007408 (lr=4.3899e-05) (hash(x)=26458975) +7316 train 6.895278 (lr=4.3880e-05) (hash(x)=26388531) +7317 train 7.451993 (lr=4.3862e-05) (hash(x)=29604116) +7318 train 6.525224 (lr=4.3843e-05) (hash(x)=23711830) +7319 train 6.759193 (lr=4.3825e-05) (hash(x)=26019142) +7320 train 6.663570 (lr=4.3807e-05) (hash(x)=25564516) +7321 train 6.603185 (lr=4.3788e-05) (hash(x)=23916481) +7322 train 6.470540 (lr=4.3770e-05) (hash(x)=22007388) +7323 train 6.600568 (lr=4.3751e-05) (hash(x)=24158545) +7324 train 6.681610 (lr=4.3733e-05) (hash(x)=26696425) +7325 train 6.859281 (lr=4.3714e-05) (hash(x)=24761648) +7326 train 6.750040 (lr=4.3696e-05) (hash(x)=21948684) +7327 train 6.499999 (lr=4.3677e-05) (hash(x)=25081877) +7328 train 6.424262 (lr=4.3659e-05) (hash(x)=23106369) +7329 train 6.911237 (lr=4.3641e-05) (hash(x)=30304149) +7330 train 6.730309 (lr=4.3622e-05) (hash(x)=25934148) +7331 train 6.907550 (lr=4.3604e-05) (hash(x)=29097664) +7332 train 6.393314 (lr=4.3585e-05) (hash(x)=23519937) +7333 train 6.825058 (lr=4.3567e-05) (hash(x)=24266623) +7334 train 6.842674 (lr=4.3549e-05) (hash(x)=26107259) +7335 train 6.519789 (lr=4.3530e-05) (hash(x)=23843571) +7336 train 6.815305 (lr=4.3512e-05) (hash(x)=25928144) +7337 train 6.595052 (lr=4.3493e-05) (hash(x)=24894741) +7338 train 6.746257 (lr=4.3475e-05) (hash(x)=26543953) +7339 train 6.539413 (lr=4.3457e-05) (hash(x)=22737047) +7340 train 7.073861 (lr=4.3438e-05) (hash(x)=28701756) +7341 train 6.771858 (lr=4.3420e-05) (hash(x)=26303095) +7342 train 6.581705 (lr=4.3402e-05) (hash(x)=25848930) +7343 train 6.732914 (lr=4.3383e-05) (hash(x)=26805739) +7344 train 6.535427 (lr=4.3365e-05) (hash(x)=23645523) +7345 train 6.601861 (lr=4.3347e-05) (hash(x)=22851082) +7346 train 6.617456 (lr=4.3328e-05) (hash(x)=22477084) +7347 train 6.637556 (lr=4.3310e-05) (hash(x)=22934009) +7348 train 6.430665 (lr=4.3292e-05) (hash(x)=22419245) +7349 train 6.627903 (lr=4.3273e-05) (hash(x)=25754460) +7350 val loss 6.6741 +7350 val perplexity 791.6248 +7350 train 6.983156 (lr=4.3255e-05) (hash(x)=28466499) +7351 train 6.664763 (lr=4.3237e-05) (hash(x)=27169927) +7352 train 6.576773 (lr=4.3219e-05) (hash(x)=22380994) +7353 train 6.722459 (lr=4.3200e-05) (hash(x)=28830379) +7354 train 6.522338 (lr=4.3182e-05) (hash(x)=25360630) +7355 train 6.260238 (lr=4.3164e-05) (hash(x)=20554517) +7356 train 6.677245 (lr=4.3145e-05) (hash(x)=25135091) +7357 train 6.941508 (lr=4.3127e-05) (hash(x)=27004910) +7358 train 7.000327 (lr=4.3109e-05) (hash(x)=26562413) +7359 train 6.779564 (lr=4.3091e-05) (hash(x)=26545491) +7360 train 6.548332 (lr=4.3072e-05) (hash(x)=24145549) +7361 train 6.582128 (lr=4.3054e-05) (hash(x)=23157780) +7362 train 6.505293 (lr=4.3036e-05) (hash(x)=23160370) +7363 train 6.572433 (lr=4.3018e-05) (hash(x)=24911153) +7364 train 7.014215 (lr=4.2999e-05) (hash(x)=28756691) +7365 train 7.070230 (lr=4.2981e-05) (hash(x)=28005975) +7366 train 6.686822 (lr=4.2963e-05) (hash(x)=25229855) +7367 train 6.659455 (lr=4.2945e-05) (hash(x)=25179497) +7368 train 6.692677 (lr=4.2927e-05) (hash(x)=25923511) +7369 train 6.525354 (lr=4.2908e-05) (hash(x)=24498432) +7370 train 6.883469 (lr=4.2890e-05) (hash(x)=30029054) +7371 train 6.750687 (lr=4.2872e-05) (hash(x)=27193267) +7372 train 6.559268 (lr=4.2854e-05) (hash(x)=23594860) +7373 train 6.473798 (lr=4.2836e-05) (hash(x)=23762517) +7374 train 6.499544 (lr=4.2817e-05) (hash(x)=23355526) +7375 train 6.732459 (lr=4.2799e-05) (hash(x)=27085003) +7376 train 6.656196 (lr=4.2781e-05) (hash(x)=24882368) +7377 train 6.502861 (lr=4.2763e-05) (hash(x)=25602670) +7378 train 6.654967 (lr=4.2745e-05) (hash(x)=25731476) +7379 train 6.462044 (lr=4.2727e-05) (hash(x)=24828956) +7380 train 6.671636 (lr=4.2708e-05) (hash(x)=23256003) +7381 train 6.715827 (lr=4.2690e-05) (hash(x)=24971143) +7382 train 6.694037 (lr=4.2672e-05) (hash(x)=25376912) +7383 train 6.608070 (lr=4.2654e-05) (hash(x)=24558202) +7384 train 6.565177 (lr=4.2636e-05) (hash(x)=21557335) +7385 train 6.979719 (lr=4.2618e-05) (hash(x)=26574617) +7386 train 6.883154 (lr=4.2600e-05) (hash(x)=26945913) +7387 train 6.448813 (lr=4.2582e-05) (hash(x)=24656329) +7388 train 6.937735 (lr=4.2563e-05) (hash(x)=27427866) +7389 train 6.572214 (lr=4.2545e-05) (hash(x)=25543675) +7390 train 6.718918 (lr=4.2527e-05) (hash(x)=26742738) +7391 train 6.910024 (lr=4.2509e-05) (hash(x)=25317684) +7392 train 6.814252 (lr=4.2491e-05) (hash(x)=26542987) +7393 train 6.561638 (lr=4.2473e-05) (hash(x)=23921505) +7394 train 6.829295 (lr=4.2455e-05) (hash(x)=28167247) +7395 train 6.874551 (lr=4.2437e-05) (hash(x)=24853134) +7396 train 6.547444 (lr=4.2419e-05) (hash(x)=24133291) +7397 train 6.610211 (lr=4.2401e-05) (hash(x)=26803457) +7398 train 6.290830 (lr=4.2383e-05) (hash(x)=20998376) +7399 train 6.815527 (lr=4.2365e-05) (hash(x)=27104868) +7400 val loss 6.6768 +7400 val perplexity 793.7536 +7400 train 6.963722 (lr=4.2347e-05) (hash(x)=30530566) +7401 train 6.797076 (lr=4.2329e-05) (hash(x)=29554134) +7402 train 6.842403 (lr=4.2311e-05) (hash(x)=26099868) +7403 train 6.640707 (lr=4.2293e-05) (hash(x)=24353634) +7404 train 6.520944 (lr=4.2274e-05) (hash(x)=24008632) +7405 train 6.550181 (lr=4.2256e-05) (hash(x)=24259019) +7406 train 6.499336 (lr=4.2238e-05) (hash(x)=22683392) +7407 train 6.880348 (lr=4.2220e-05) (hash(x)=24806274) +7408 train 6.293403 (lr=4.2202e-05) (hash(x)=19427593) +7409 train 6.808961 (lr=4.2184e-05) (hash(x)=24980112) +7410 train 6.674761 (lr=4.2166e-05) (hash(x)=26668975) +7411 train 6.834339 (lr=4.2149e-05) (hash(x)=27625217) +7412 train 6.660984 (lr=4.2131e-05) (hash(x)=25068842) +7413 train 7.100204 (lr=4.2113e-05) (hash(x)=28729128) +7414 train 7.100906 (lr=4.2095e-05) (hash(x)=26934049) +7415 train 6.570048 (lr=4.2077e-05) (hash(x)=24341937) +7416 train 6.438373 (lr=4.2059e-05) (hash(x)=22435637) +7417 train 6.556995 (lr=4.2041e-05) (hash(x)=21697871) +7418 train 6.751103 (lr=4.2023e-05) (hash(x)=25110175) +7419 train 6.770072 (lr=4.2005e-05) (hash(x)=26362971) +7420 train 6.712819 (lr=4.1987e-05) (hash(x)=25099947) +7421 train 6.446992 (lr=4.1969e-05) (hash(x)=21209140) +7422 train 6.379606 (lr=4.1951e-05) (hash(x)=21156628) +7423 train 6.437874 (lr=4.1933e-05) (hash(x)=22736558) +7424 train 6.551506 (lr=4.1915e-05) (hash(x)=22599045) +7425 train 6.408646 (lr=4.1897e-05) (hash(x)=19835086) +7426 train 6.363206 (lr=4.1879e-05) (hash(x)=19681348) +7427 train 6.796852 (lr=4.1862e-05) (hash(x)=26287113) +7428 train 6.491601 (lr=4.1844e-05) (hash(x)=25601562) +7429 train 6.525100 (lr=4.1826e-05) (hash(x)=23701414) +7430 train 6.615187 (lr=4.1808e-05) (hash(x)=25866910) +7431 train 6.830785 (lr=4.1790e-05) (hash(x)=23843744) +7432 train 6.867092 (lr=4.1772e-05) (hash(x)=28445342) +7433 train 6.369881 (lr=4.1754e-05) (hash(x)=23013949) +7434 train 6.672235 (lr=4.1736e-05) (hash(x)=23503224) +7435 train 6.537111 (lr=4.1719e-05) (hash(x)=24509223) +7436 train 6.857903 (lr=4.1701e-05) (hash(x)=29069071) +7437 train 6.590974 (lr=4.1683e-05) (hash(x)=25778863) +7438 train 6.799545 (lr=4.1665e-05) (hash(x)=30702183) +7439 train 6.804401 (lr=4.1647e-05) (hash(x)=27218468) +7440 train 6.664795 (lr=4.1629e-05) (hash(x)=25120377) +7441 train 6.754530 (lr=4.1612e-05) (hash(x)=27330382) +7442 train 6.762718 (lr=4.1594e-05) (hash(x)=26874766) +7443 train 6.502801 (lr=4.1576e-05) (hash(x)=22348365) +7444 train 6.497804 (lr=4.1558e-05) (hash(x)=23302341) +7445 train 6.852642 (lr=4.1540e-05) (hash(x)=25557954) +7446 train 6.595945 (lr=4.1523e-05) (hash(x)=27009906) +7447 train 6.564153 (lr=4.1505e-05) (hash(x)=26042053) +7448 train 7.043893 (lr=4.1487e-05) (hash(x)=22036412) +7449 train 6.803277 (lr=4.1469e-05) (hash(x)=27956533) +7450 val loss 6.6790 +7450 val perplexity 795.5117 +7450 train 6.386014 (lr=4.1451e-05) (hash(x)=23056562) +7451 train 6.495496 (lr=4.1434e-05) (hash(x)=25652715) +7452 train 6.550363 (lr=4.1416e-05) (hash(x)=26142336) +7453 train 6.624763 (lr=4.1398e-05) (hash(x)=24871264) +7454 train 6.766588 (lr=4.1380e-05) (hash(x)=27478967) +7455 train 6.664369 (lr=4.1363e-05) (hash(x)=25776082) +7456 train 6.654572 (lr=4.1345e-05) (hash(x)=24328862) +7457 train 6.674741 (lr=4.1327e-05) (hash(x)=24604995) +7458 train 6.388486 (lr=4.1309e-05) (hash(x)=22791916) +7459 train 6.450645 (lr=4.1292e-05) (hash(x)=22229606) +7460 train 6.678285 (lr=4.1274e-05) (hash(x)=25428460) +7461 train 6.744768 (lr=4.1256e-05) (hash(x)=25518638) +7462 train 6.408605 (lr=4.1239e-05) (hash(x)=21443388) +7463 train 6.368228 (lr=4.1221e-05) (hash(x)=21594447) +7464 train 6.395185 (lr=4.1203e-05) (hash(x)=21787075) +7465 train 6.622315 (lr=4.1185e-05) (hash(x)=24049225) +7466 train 6.717178 (lr=4.1168e-05) (hash(x)=23530828) +7467 train 6.758842 (lr=4.1150e-05) (hash(x)=23722987) +7468 train 6.638102 (lr=4.1132e-05) (hash(x)=24286323) +7469 train 6.468109 (lr=4.1115e-05) (hash(x)=22538896) +7470 train 6.673298 (lr=4.1097e-05) (hash(x)=25515278) +7471 train 6.435717 (lr=4.1079e-05) (hash(x)=21674469) +7472 train 6.491863 (lr=4.1062e-05) (hash(x)=23162283) +7473 train 6.263569 (lr=4.1044e-05) (hash(x)=23633119) +7474 train 6.344867 (lr=4.1026e-05) (hash(x)=22272254) +7475 train 6.440292 (lr=4.1009e-05) (hash(x)=21200087) +7476 train 6.742130 (lr=4.0991e-05) (hash(x)=24634897) +7477 train 6.637197 (lr=4.0974e-05) (hash(x)=25076156) +7478 train 6.524723 (lr=4.0956e-05) (hash(x)=24198586) +7479 train 6.675777 (lr=4.0938e-05) (hash(x)=26213966) +7480 train 6.634652 (lr=4.0921e-05) (hash(x)=25814500) +7481 train 6.261082 (lr=4.0903e-05) (hash(x)=22052502) +7482 train 6.615785 (lr=4.0886e-05) (hash(x)=27717860) +7483 train 6.559366 (lr=4.0868e-05) (hash(x)=23103626) +7484 train 6.450264 (lr=4.0850e-05) (hash(x)=22212579) +7485 train 6.651353 (lr=4.0833e-05) (hash(x)=24920844) +7486 train 6.675838 (lr=4.0815e-05) (hash(x)=23795969) +7487 train 6.500902 (lr=4.0798e-05) (hash(x)=23770702) +7488 train 6.519300 (lr=4.0780e-05) (hash(x)=24156454) +7489 train 6.586504 (lr=4.0763e-05) (hash(x)=22965430) +7490 train 6.677139 (lr=4.0745e-05) (hash(x)=24403702) +7491 train 6.670397 (lr=4.0727e-05) (hash(x)=26139229) +7492 train 6.579942 (lr=4.0710e-05) (hash(x)=23037161) +7493 train 6.501621 (lr=4.0692e-05) (hash(x)=25738110) +7494 train 6.777252 (lr=4.0675e-05) (hash(x)=26359303) +7495 train 6.848044 (lr=4.0657e-05) (hash(x)=27829878) +7496 train 6.406326 (lr=4.0640e-05) (hash(x)=24114795) +7497 train 6.470056 (lr=4.0622e-05) (hash(x)=20576987) +7498 train 6.798357 (lr=4.0605e-05) (hash(x)=26122779) +7499 train 7.071010 (lr=4.0587e-05) (hash(x)=27221940) +7500 val loss 6.6778 +7500 val perplexity 794.6060 +7500 train 6.336708 (lr=4.0570e-05) (hash(x)=21246967) +7501 train 6.576608 (lr=4.0552e-05) (hash(x)=25272042) +7502 train 7.366607 (lr=4.0535e-05) (hash(x)=28836949) +7503 train 6.876251 (lr=4.0517e-05) (hash(x)=29177278) +7504 train 6.594550 (lr=4.0500e-05) (hash(x)=23840882) +7505 train 6.383641 (lr=4.0482e-05) (hash(x)=22186169) +7506 train 7.045199 (lr=4.0465e-05) (hash(x)=27941595) +7507 train 6.699123 (lr=4.0447e-05) (hash(x)=26418252) +7508 train 6.777814 (lr=4.0430e-05) (hash(x)=24614728) +7509 train 6.731606 (lr=4.0412e-05) (hash(x)=26354367) +7510 train 6.626625 (lr=4.0395e-05) (hash(x)=26652830) +7511 train 6.656984 (lr=4.0378e-05) (hash(x)=26020089) +7512 train 6.496828 (lr=4.0360e-05) (hash(x)=23794444) +7513 train 6.712035 (lr=4.0343e-05) (hash(x)=26102649) +7514 train 6.738059 (lr=4.0325e-05) (hash(x)=22617015) +7515 train 6.537338 (lr=4.0308e-05) (hash(x)=24114078) +7516 train 6.554920 (lr=4.0290e-05) (hash(x)=26795488) +7517 train 6.549732 (lr=4.0273e-05) (hash(x)=21065534) +7518 train 6.377985 (lr=4.0256e-05) (hash(x)=21785713) +7519 train 6.685277 (lr=4.0238e-05) (hash(x)=24676475) +7520 train 6.677341 (lr=4.0221e-05) (hash(x)=25871720) +7521 train 6.704437 (lr=4.0203e-05) (hash(x)=23258275) +7522 train 6.753885 (lr=4.0186e-05) (hash(x)=26974040) +7523 train 7.007971 (lr=4.0169e-05) (hash(x)=30538340) +7524 train 6.395813 (lr=4.0151e-05) (hash(x)=21300961) +7525 train 6.658528 (lr=4.0134e-05) (hash(x)=24264874) +7526 train 6.416191 (lr=4.0117e-05) (hash(x)=21897055) +7527 train 6.311632 (lr=4.0099e-05) (hash(x)=24056174) +7528 train 6.522072 (lr=4.0082e-05) (hash(x)=25361413) +7529 train 6.482234 (lr=4.0065e-05) (hash(x)=22087466) +7530 train 6.798813 (lr=4.0047e-05) (hash(x)=25185013) +7531 train 6.985558 (lr=4.0030e-05) (hash(x)=23937392) +7532 train 7.020616 (lr=4.0013e-05) (hash(x)=24485761) +7533 train 6.554741 (lr=3.9995e-05) (hash(x)=24839143) +7534 train 6.748693 (lr=3.9978e-05) (hash(x)=25648063) +7535 train 6.403526 (lr=3.9961e-05) (hash(x)=21887514) +7536 train 6.750354 (lr=3.9943e-05) (hash(x)=29370437) +7537 train 6.857024 (lr=3.9926e-05) (hash(x)=27733168) +7538 train 6.780139 (lr=3.9909e-05) (hash(x)=24989210) +7539 train 6.665413 (lr=3.9892e-05) (hash(x)=24617463) +7540 train 6.422860 (lr=3.9874e-05) (hash(x)=20913252) +7541 train 6.753971 (lr=3.9857e-05) (hash(x)=24850107) +7542 train 6.503296 (lr=3.9840e-05) (hash(x)=25930790) +7543 train 6.513616 (lr=3.9822e-05) (hash(x)=24196100) +7544 train 6.672065 (lr=3.9805e-05) (hash(x)=27344264) +7545 train 6.376647 (lr=3.9788e-05) (hash(x)=23547632) +7546 train 6.527713 (lr=3.9771e-05) (hash(x)=23887753) +7547 train 7.208600 (lr=3.9753e-05) (hash(x)=26719200) +7548 train 7.100832 (lr=3.9736e-05) (hash(x)=27682392) +7549 train 6.456378 (lr=3.9719e-05) (hash(x)=24789657) +7550 val loss 6.6719 +7550 val perplexity 789.8726 +7550 train 6.435788 (lr=3.9702e-05) (hash(x)=23478093) +7551 train 6.594149 (lr=3.9685e-05) (hash(x)=25700093) +7552 train 6.895485 (lr=3.9667e-05) (hash(x)=29726620) +7553 train 6.645132 (lr=3.9650e-05) (hash(x)=25702686) +7554 train 6.510483 (lr=3.9633e-05) (hash(x)=23474272) +7555 train 6.697042 (lr=3.9616e-05) (hash(x)=25253145) +7556 train 6.772842 (lr=3.9599e-05) (hash(x)=26434297) +7557 train 7.173682 (lr=3.9581e-05) (hash(x)=30032123) +7558 train 6.912156 (lr=3.9564e-05) (hash(x)=26391058) +7559 train 6.525450 (lr=3.9547e-05) (hash(x)=24365834) +7560 train 6.849874 (lr=3.9530e-05) (hash(x)=26513237) +7561 train 6.601866 (lr=3.9513e-05) (hash(x)=25472287) +7562 train 6.565958 (lr=3.9496e-05) (hash(x)=25692067) +7563 train 6.556322 (lr=3.9478e-05) (hash(x)=23331500) +7564 train 6.558510 (lr=3.9461e-05) (hash(x)=25278061) +7565 train 6.589468 (lr=3.9444e-05) (hash(x)=25195327) +7566 train 6.504879 (lr=3.9427e-05) (hash(x)=24923971) +7567 train 6.644042 (lr=3.9410e-05) (hash(x)=25631786) +7568 train 6.616380 (lr=3.9393e-05) (hash(x)=25739951) +7569 train 6.655359 (lr=3.9376e-05) (hash(x)=23174094) +7570 train 6.773734 (lr=3.9358e-05) (hash(x)=22926830) +7571 train 6.787888 (lr=3.9341e-05) (hash(x)=26627700) +7572 train 6.832498 (lr=3.9324e-05) (hash(x)=27230179) +7573 train 6.645321 (lr=3.9307e-05) (hash(x)=22636814) +7574 train 6.812033 (lr=3.9290e-05) (hash(x)=26282102) +7575 train 6.569860 (lr=3.9273e-05) (hash(x)=24452345) +7576 train 6.354856 (lr=3.9256e-05) (hash(x)=21561389) +7577 train 6.435582 (lr=3.9239e-05) (hash(x)=24474970) +7578 train 5.956204 (lr=3.9222e-05) (hash(x)=17994617) +7579 train 6.338360 (lr=3.9205e-05) (hash(x)=21063302) +7580 train 6.639052 (lr=3.9188e-05) (hash(x)=24617151) +7581 train 6.530328 (lr=3.9171e-05) (hash(x)=26114864) +7582 train 6.526371 (lr=3.9154e-05) (hash(x)=25091911) +7583 train 6.422962 (lr=3.9137e-05) (hash(x)=21465330) +7584 train 6.595773 (lr=3.9120e-05) (hash(x)=21966553) +7585 train 6.379537 (lr=3.9103e-05) (hash(x)=23377832) +7586 train 6.636463 (lr=3.9085e-05) (hash(x)=22300027) +7587 train 6.564620 (lr=3.9068e-05) (hash(x)=23031979) +7588 train 6.618315 (lr=3.9051e-05) (hash(x)=24882930) +7589 train 6.325606 (lr=3.9034e-05) (hash(x)=23424300) +7590 train 6.776273 (lr=3.9017e-05) (hash(x)=25807351) +7591 train 6.272079 (lr=3.9000e-05) (hash(x)=20427493) +7592 train 6.389126 (lr=3.8983e-05) (hash(x)=24612130) +7593 train 6.332981 (lr=3.8966e-05) (hash(x)=22165520) +7594 train 6.608325 (lr=3.8950e-05) (hash(x)=26430133) +7595 train 6.419967 (lr=3.8933e-05) (hash(x)=23476688) +7596 train 7.054042 (lr=3.8916e-05) (hash(x)=26303877) +7597 train 6.351674 (lr=3.8899e-05) (hash(x)=16631115) +7598 train 6.633428 (lr=3.8882e-05) (hash(x)=25186344) +7599 train 6.787073 (lr=3.8865e-05) (hash(x)=25439720) +7600 val loss 6.6707 +7600 val perplexity 788.9398 +7600 train 6.914994 (lr=3.8848e-05) (hash(x)=26896463) +7601 train 6.978131 (lr=3.8831e-05) (hash(x)=27737064) +7602 train 6.681125 (lr=3.8814e-05) (hash(x)=24609310) +7603 train 6.648186 (lr=3.8797e-05) (hash(x)=26682690) +7604 train 6.590759 (lr=3.8780e-05) (hash(x)=24183905) +7605 train 6.709817 (lr=3.8763e-05) (hash(x)=29288247) +7606 train 6.493871 (lr=3.8746e-05) (hash(x)=23775779) +7607 train 6.253738 (lr=3.8729e-05) (hash(x)=21652988) +7608 train 6.595964 (lr=3.8712e-05) (hash(x)=25528958) +7609 train 6.514751 (lr=3.8696e-05) (hash(x)=25159500) +7610 train 6.604710 (lr=3.8679e-05) (hash(x)=25872544) +7611 train 6.669449 (lr=3.8662e-05) (hash(x)=26679136) +7612 train 6.461734 (lr=3.8645e-05) (hash(x)=24253918) +7613 train 6.509511 (lr=3.8628e-05) (hash(x)=24323038) +7614 train 6.674759 (lr=3.8611e-05) (hash(x)=27469726) +7615 train 6.675195 (lr=3.8594e-05) (hash(x)=22546779) +7616 train 6.831690 (lr=3.8577e-05) (hash(x)=22158965) +7617 train 6.552657 (lr=3.8561e-05) (hash(x)=24696198) +7618 train 6.487308 (lr=3.8544e-05) (hash(x)=21717599) +7619 train 6.632233 (lr=3.8527e-05) (hash(x)=25183353) +7620 train 6.550217 (lr=3.8510e-05) (hash(x)=23696483) +7621 train 6.300082 (lr=3.8493e-05) (hash(x)=22113763) +7622 train 6.035616 (lr=3.8477e-05) (hash(x)=17460309) +7623 train 6.282424 (lr=3.8460e-05) (hash(x)=20855736) +7624 train 6.577970 (lr=3.8443e-05) (hash(x)=25062029) +7625 train 6.576305 (lr=3.8426e-05) (hash(x)=24961706) +7626 train 6.330944 (lr=3.8409e-05) (hash(x)=21374655) +7627 train 6.427788 (lr=3.8393e-05) (hash(x)=20906769) +7628 train 6.810165 (lr=3.8376e-05) (hash(x)=29044808) +7629 train 6.839183 (lr=3.8359e-05) (hash(x)=27261849) +7630 train 6.716559 (lr=3.8342e-05) (hash(x)=25862464) +7631 train 6.820354 (lr=3.8325e-05) (hash(x)=27725873) +7632 train 7.147611 (lr=3.8309e-05) (hash(x)=30991833) +7633 train 6.610614 (lr=3.8292e-05) (hash(x)=23330476) +7634 train 6.513046 (lr=3.8275e-05) (hash(x)=25188641) +7635 train 6.554767 (lr=3.8258e-05) (hash(x)=25108332) +7636 train 6.828986 (lr=3.8242e-05) (hash(x)=30511751) +7637 train 6.572528 (lr=3.8225e-05) (hash(x)=25657859) +7638 train 6.698097 (lr=3.8208e-05) (hash(x)=24589729) +7639 train 6.854860 (lr=3.8191e-05) (hash(x)=24582989) +7640 train 6.556986 (lr=3.8175e-05) (hash(x)=24558698) +7641 train 6.561925 (lr=3.8158e-05) (hash(x)=23349707) +7642 train 6.723874 (lr=3.8141e-05) (hash(x)=27536067) +7643 train 6.501926 (lr=3.8125e-05) (hash(x)=22469417) +7644 train 6.688893 (lr=3.8108e-05) (hash(x)=23907537) +7645 train 6.598038 (lr=3.8091e-05) (hash(x)=25509306) +7646 train 6.415997 (lr=3.8075e-05) (hash(x)=23853273) +7647 train 6.618357 (lr=3.8058e-05) (hash(x)=24822372) +7648 train 6.404264 (lr=3.8041e-05) (hash(x)=21453583) +7649 train 6.493309 (lr=3.8025e-05) (hash(x)=23983201) +7650 val loss 6.6795 +7650 val perplexity 795.9128 +7650 train 6.821159 (lr=3.8008e-05) (hash(x)=27119679) +7651 train 6.597961 (lr=3.7991e-05) (hash(x)=26039874) +7652 train 6.576206 (lr=3.7975e-05) (hash(x)=24045094) +7653 train 6.561910 (lr=3.7958e-05) (hash(x)=22517876) +7654 train 6.673608 (lr=3.7941e-05) (hash(x)=23572839) +7655 train 6.852081 (lr=3.7925e-05) (hash(x)=25624588) +7656 train 6.588033 (lr=3.7908e-05) (hash(x)=24891004) +7657 train 6.586327 (lr=3.7892e-05) (hash(x)=22319601) +7658 train 6.293853 (lr=3.7875e-05) (hash(x)=22203556) +7659 train 6.484670 (lr=3.7858e-05) (hash(x)=24225722) +7660 train 6.570678 (lr=3.7842e-05) (hash(x)=24571169) +7661 train 6.579637 (lr=3.7825e-05) (hash(x)=25483578) +7662 train 6.805276 (lr=3.7809e-05) (hash(x)=24831282) +7663 train 6.644073 (lr=3.7792e-05) (hash(x)=23566489) +7664 train 6.693688 (lr=3.7775e-05) (hash(x)=25708298) +7665 train 6.459038 (lr=3.7759e-05) (hash(x)=21390177) +7666 train 6.538207 (lr=3.7742e-05) (hash(x)=25275054) +7667 train 6.829160 (lr=3.7726e-05) (hash(x)=28993619) +7668 train 7.296783 (lr=3.7709e-05) (hash(x)=30259974) +7669 train 6.944072 (lr=3.7693e-05) (hash(x)=26281157) +7670 train 6.657648 (lr=3.7676e-05) (hash(x)=26806152) +7671 train 6.635847 (lr=3.7660e-05) (hash(x)=28117387) +7672 train 6.458244 (lr=3.7643e-05) (hash(x)=22480930) +7673 train 6.509645 (lr=3.7626e-05) (hash(x)=23750652) +7674 train 6.581586 (lr=3.7610e-05) (hash(x)=24763622) +7675 train 6.574565 (lr=3.7593e-05) (hash(x)=26294682) +7676 train 6.828773 (lr=3.7577e-05) (hash(x)=27468276) +7677 train 6.335279 (lr=3.7560e-05) (hash(x)=21421993) +7678 train 6.524513 (lr=3.7544e-05) (hash(x)=23173696) +7679 train 6.479890 (lr=3.7527e-05) (hash(x)=26874283) +7680 train 6.500362 (lr=3.7511e-05) (hash(x)=23607479) +7681 train 6.613008 (lr=3.7494e-05) (hash(x)=21539486) +7682 train 6.155995 (lr=3.7478e-05) (hash(x)=17477099) +7683 train 6.352081 (lr=3.7462e-05) (hash(x)=20610535) +7684 train 6.566343 (lr=3.7445e-05) (hash(x)=24784717) +7685 train 6.747506 (lr=3.7429e-05) (hash(x)=24529403) +7686 train 6.533147 (lr=3.7412e-05) (hash(x)=24066216) +7687 train 6.998796 (lr=3.7396e-05) (hash(x)=28570123) +7688 train 6.806288 (lr=3.7379e-05) (hash(x)=24455358) +7689 train 6.475570 (lr=3.7363e-05) (hash(x)=20561973) +7690 train 6.711328 (lr=3.7346e-05) (hash(x)=27778739) +7691 train 6.441564 (lr=3.7330e-05) (hash(x)=24386170) +7692 train 6.599199 (lr=3.7314e-05) (hash(x)=26831711) +7693 train 6.716424 (lr=3.7297e-05) (hash(x)=24162470) +7694 train 6.718179 (lr=3.7281e-05) (hash(x)=28497301) +7695 train 6.598321 (lr=3.7264e-05) (hash(x)=24807017) +7696 train 6.714472 (lr=3.7248e-05) (hash(x)=25794880) +7697 train 6.439725 (lr=3.7232e-05) (hash(x)=22676021) +7698 train 6.549085 (lr=3.7215e-05) (hash(x)=24138115) +7699 train 6.487312 (lr=3.7199e-05) (hash(x)=23678981) +7700 val loss 6.6757 +7700 val perplexity 792.9206 +7700 train 6.533952 (lr=3.7183e-05) (hash(x)=25072330) +7701 train 6.445240 (lr=3.7166e-05) (hash(x)=22922754) +7702 train 6.665409 (lr=3.7150e-05) (hash(x)=26456236) +7703 train 6.583162 (lr=3.7133e-05) (hash(x)=25189993) +7704 train 6.637260 (lr=3.7117e-05) (hash(x)=23137141) +7705 train 7.006622 (lr=3.7101e-05) (hash(x)=26428613) +7706 train 6.495636 (lr=3.7084e-05) (hash(x)=22157979) +7707 train 6.260461 (lr=3.7068e-05) (hash(x)=21889553) +7708 train 6.981061 (lr=3.7052e-05) (hash(x)=29218200) +7709 train 6.432395 (lr=3.7035e-05) (hash(x)=22267059) +7710 train 6.512971 (lr=3.7019e-05) (hash(x)=22468568) +7711 train 6.970141 (lr=3.7003e-05) (hash(x)=29202226) +7712 train 6.858507 (lr=3.6987e-05) (hash(x)=28090830) +7713 train 6.842725 (lr=3.6970e-05) (hash(x)=26773985) +7714 train 6.503704 (lr=3.6954e-05) (hash(x)=22143665) +7715 train 6.586791 (lr=3.6938e-05) (hash(x)=22117007) +7716 train 6.881764 (lr=3.6921e-05) (hash(x)=25918720) +7717 train 7.338179 (lr=3.6905e-05) (hash(x)=28554085) +7718 train 7.565788 (lr=3.6889e-05) (hash(x)=30377734) +7719 train 6.586313 (lr=3.6873e-05) (hash(x)=26060713) +7720 train 6.709439 (lr=3.6856e-05) (hash(x)=26534669) +7721 train 6.472769 (lr=3.6840e-05) (hash(x)=22760237) +7722 train 6.594124 (lr=3.6824e-05) (hash(x)=23966049) +7723 train 6.578218 (lr=3.6808e-05) (hash(x)=21459371) +7724 train 7.099968 (lr=3.6791e-05) (hash(x)=30917512) +7725 train 7.152944 (lr=3.6775e-05) (hash(x)=29904475) +7726 train 6.723958 (lr=3.6759e-05) (hash(x)=27226081) +7727 train 6.630601 (lr=3.6743e-05) (hash(x)=23053285) +7728 train 6.874565 (lr=3.6727e-05) (hash(x)=25329846) +7729 train 6.775817 (lr=3.6710e-05) (hash(x)=25230185) +7730 train 6.984717 (lr=3.6694e-05) (hash(x)=28455655) +7731 train 6.706703 (lr=3.6678e-05) (hash(x)=27336585) +7732 train 6.772488 (lr=3.6662e-05) (hash(x)=28130618) +7733 train 6.528971 (lr=3.6646e-05) (hash(x)=23794687) +7734 train 6.523548 (lr=3.6630e-05) (hash(x)=22123174) +7735 train 6.619587 (lr=3.6613e-05) (hash(x)=21968481) +7736 train 6.466017 (lr=3.6597e-05) (hash(x)=23020813) +7737 train 7.032118 (lr=3.6581e-05) (hash(x)=29534235) +7738 train 6.733896 (lr=3.6565e-05) (hash(x)=29525683) +7739 train 6.642055 (lr=3.6549e-05) (hash(x)=28089468) +7740 train 6.547453 (lr=3.6533e-05) (hash(x)=25903904) +7741 train 6.720105 (lr=3.6517e-05) (hash(x)=25562718) +7742 train 6.100623 (lr=3.6500e-05) (hash(x)=21029319) +7743 train 6.611395 (lr=3.6484e-05) (hash(x)=24492698) +7744 train 6.548602 (lr=3.6468e-05) (hash(x)=25471162) +7745 train 6.293752 (lr=3.6452e-05) (hash(x)=21966131) +7746 train 6.364090 (lr=3.6436e-05) (hash(x)=25554808) +7747 train 6.548221 (lr=3.6420e-05) (hash(x)=24244858) +7748 train 6.604419 (lr=3.6404e-05) (hash(x)=23624474) +7749 train 6.607872 (lr=3.6388e-05) (hash(x)=23933180) +7750 val loss 6.6704 +7750 val perplexity 788.6942 +7750 train 7.022202 (lr=3.6372e-05) (hash(x)=28681252) +7751 train 6.664559 (lr=3.6356e-05) (hash(x)=25760806) +7752 train 6.575202 (lr=3.6340e-05) (hash(x)=24125755) +7753 train 6.463812 (lr=3.6323e-05) (hash(x)=23692433) +7754 train 6.393904 (lr=3.6307e-05) (hash(x)=19631607) +7755 train 6.789625 (lr=3.6291e-05) (hash(x)=28695065) +7756 train 6.887761 (lr=3.6275e-05) (hash(x)=28354129) +7757 train 6.554893 (lr=3.6259e-05) (hash(x)=23940798) +7758 train 6.629671 (lr=3.6243e-05) (hash(x)=26625318) +7759 train 6.819131 (lr=3.6227e-05) (hash(x)=27417392) +7760 train 6.569164 (lr=3.6211e-05) (hash(x)=25169375) +7761 train 6.134173 (lr=3.6195e-05) (hash(x)=19572409) +7762 train 6.496423 (lr=3.6179e-05) (hash(x)=23864239) +7763 train 6.408600 (lr=3.6163e-05) (hash(x)=23855495) +7764 train 7.324286 (lr=3.6147e-05) (hash(x)=28565044) +7765 train 6.296550 (lr=3.6131e-05) (hash(x)=20398052) +7766 train 6.690843 (lr=3.6115e-05) (hash(x)=24123056) +7767 train 6.847931 (lr=3.6099e-05) (hash(x)=26767105) +7768 train 6.793277 (lr=3.6083e-05) (hash(x)=27494455) +7769 train 6.957162 (lr=3.6067e-05) (hash(x)=29008178) +7770 train 6.639150 (lr=3.6051e-05) (hash(x)=25567434) +7771 train 6.812973 (lr=3.6035e-05) (hash(x)=28544187) +7772 train 6.324443 (lr=3.6020e-05) (hash(x)=20818451) +7773 train 6.669033 (lr=3.6004e-05) (hash(x)=30138063) +7774 train 6.464606 (lr=3.5988e-05) (hash(x)=22996166) +7775 train 6.691620 (lr=3.5972e-05) (hash(x)=25117678) +7776 train 6.424893 (lr=3.5956e-05) (hash(x)=22444101) +7777 train 6.772670 (lr=3.5940e-05) (hash(x)=26634522) +7778 train 6.541060 (lr=3.5924e-05) (hash(x)=22961993) +7779 train 6.556573 (lr=3.5908e-05) (hash(x)=23552401) +7780 train 6.566035 (lr=3.5892e-05) (hash(x)=23101383) +7781 train 6.781307 (lr=3.5876e-05) (hash(x)=26340139) +7782 train 6.306129 (lr=3.5860e-05) (hash(x)=21444239) +7783 train 6.340297 (lr=3.5845e-05) (hash(x)=24233758) +7784 train 6.695933 (lr=3.5829e-05) (hash(x)=26129818) +7785 train 6.518198 (lr=3.5813e-05) (hash(x)=23126166) +7786 train 6.616628 (lr=3.5797e-05) (hash(x)=21067978) +7787 train 6.318052 (lr=3.5781e-05) (hash(x)=21618887) +7788 train 6.534423 (lr=3.5765e-05) (hash(x)=25474342) +7789 train 6.844591 (lr=3.5749e-05) (hash(x)=25175000) +7790 train 6.609581 (lr=3.5734e-05) (hash(x)=25621769) +7791 train 6.956961 (lr=3.5718e-05) (hash(x)=29907634) +7792 train 6.047832 (lr=3.5702e-05) (hash(x)=19989629) +7793 train 6.232030 (lr=3.5686e-05) (hash(x)=21646970) +7794 train 6.609250 (lr=3.5670e-05) (hash(x)=22763930) +7795 train 6.326595 (lr=3.5654e-05) (hash(x)=20462990) +7796 train 6.559404 (lr=3.5639e-05) (hash(x)=26961413) +7797 train 6.476683 (lr=3.5623e-05) (hash(x)=24677361) +7798 train 6.437519 (lr=3.5607e-05) (hash(x)=23652398) +7799 train 6.563979 (lr=3.5591e-05) (hash(x)=23552436) +7800 val loss 6.6768 +7800 val perplexity 793.7733 +7800 train 6.525675 (lr=3.5576e-05) (hash(x)=24292897) +7801 train 6.545325 (lr=3.5560e-05) (hash(x)=25011036) +7802 train 6.675313 (lr=3.5544e-05) (hash(x)=24555115) +7803 train 7.070667 (lr=3.5528e-05) (hash(x)=24794800) +7804 train 6.742511 (lr=3.5513e-05) (hash(x)=28972091) +7805 train 6.947727 (lr=3.5497e-05) (hash(x)=26425104) +7806 train 6.541933 (lr=3.5481e-05) (hash(x)=21123921) +7807 train 7.024318 (lr=3.5465e-05) (hash(x)=28610406) +7808 train 6.738506 (lr=3.5450e-05) (hash(x)=22785147) +7809 train 6.632240 (lr=3.5434e-05) (hash(x)=25811870) +7810 train 6.565361 (lr=3.5418e-05) (hash(x)=23514152) +7811 train 6.685027 (lr=3.5402e-05) (hash(x)=24281320) +7812 train 6.280391 (lr=3.5387e-05) (hash(x)=20626927) +7813 train 6.621869 (lr=3.5371e-05) (hash(x)=24391439) +7814 train 6.868849 (lr=3.5355e-05) (hash(x)=24587029) +7815 train 6.558184 (lr=3.5340e-05) (hash(x)=23858212) +7816 train 6.635289 (lr=3.5324e-05) (hash(x)=23932873) +7817 train 6.563950 (lr=3.5308e-05) (hash(x)=23817740) +7818 train 6.541761 (lr=3.5293e-05) (hash(x)=23082139) +7819 train 6.526227 (lr=3.5277e-05) (hash(x)=24304509) +7820 train 6.863393 (lr=3.5261e-05) (hash(x)=27894034) +7821 train 6.303819 (lr=3.5246e-05) (hash(x)=23243601) +7822 train 6.555946 (lr=3.5230e-05) (hash(x)=26743827) +7823 train 6.141901 (lr=3.5214e-05) (hash(x)=20567764) +7824 train 6.507846 (lr=3.5199e-05) (hash(x)=24590915) +7825 train 6.420918 (lr=3.5183e-05) (hash(x)=23519078) +7826 train 6.427283 (lr=3.5167e-05) (hash(x)=22956392) +7827 train 6.574813 (lr=3.5152e-05) (hash(x)=26873246) +7828 train 6.518413 (lr=3.5136e-05) (hash(x)=21559865) +7829 train 6.413501 (lr=3.5121e-05) (hash(x)=23062298) +7830 train 6.524779 (lr=3.5105e-05) (hash(x)=21387976) +7831 train 6.771373 (lr=3.5089e-05) (hash(x)=29631106) +7832 train 6.429782 (lr=3.5074e-05) (hash(x)=22684316) +7833 train 6.284540 (lr=3.5058e-05) (hash(x)=21648452) +7834 train 6.600772 (lr=3.5043e-05) (hash(x)=25492959) +7835 train 6.756242 (lr=3.5027e-05) (hash(x)=25305791) +7836 train 6.446573 (lr=3.5012e-05) (hash(x)=23222514) +7837 train 6.633222 (lr=3.4996e-05) (hash(x)=22307623) +7838 train 6.550487 (lr=3.4981e-05) (hash(x)=24837302) +7839 train 6.274726 (lr=3.4965e-05) (hash(x)=19843564) +7840 train 7.240134 (lr=3.4949e-05) (hash(x)=31677324) +7841 train 6.421285 (lr=3.4934e-05) (hash(x)=22655517) +7842 train 6.501403 (lr=3.4918e-05) (hash(x)=25755154) +7843 train 6.703548 (lr=3.4903e-05) (hash(x)=25101224) +7844 train 6.540807 (lr=3.4887e-05) (hash(x)=21343640) +7845 train 6.827384 (lr=3.4872e-05) (hash(x)=25032974) +7846 train 6.569338 (lr=3.4856e-05) (hash(x)=24889640) +7847 train 6.349977 (lr=3.4841e-05) (hash(x)=22589891) +7848 train 6.539163 (lr=3.4825e-05) (hash(x)=27144794) +7849 train 6.548454 (lr=3.4810e-05) (hash(x)=25489784) +7850 val loss 6.6724 +7850 val perplexity 790.2844 +7850 train 6.565800 (lr=3.4794e-05) (hash(x)=25347574) +7851 train 6.607196 (lr=3.4779e-05) (hash(x)=24533991) +7852 train 6.514316 (lr=3.4764e-05) (hash(x)=25767139) +7853 train 6.160069 (lr=3.4748e-05) (hash(x)=18969890) +7854 train 6.512647 (lr=3.4733e-05) (hash(x)=25600074) +7855 train 6.410480 (lr=3.4717e-05) (hash(x)=21183943) +7856 train 7.025703 (lr=3.4702e-05) (hash(x)=28609090) +7857 train 6.413728 (lr=3.4686e-05) (hash(x)=24000198) +7858 train 6.657486 (lr=3.4671e-05) (hash(x)=24678067) +7859 train 6.449864 (lr=3.4655e-05) (hash(x)=25008761) +7860 train 6.351762 (lr=3.4640e-05) (hash(x)=20476490) +7861 train 6.752309 (lr=3.4625e-05) (hash(x)=23398221) +7862 train 6.219427 (lr=3.4609e-05) (hash(x)=22398079) +7863 train 6.808530 (lr=3.4594e-05) (hash(x)=26152241) +7864 train 6.691321 (lr=3.4578e-05) (hash(x)=24785394) +7865 train 6.537114 (lr=3.4563e-05) (hash(x)=25486070) +7866 train 6.456749 (lr=3.4548e-05) (hash(x)=24608065) +7867 train 6.715192 (lr=3.4532e-05) (hash(x)=26276234) +7868 train 6.773761 (lr=3.4517e-05) (hash(x)=27480342) +7869 train 6.544905 (lr=3.4502e-05) (hash(x)=23622107) +7870 train 6.672452 (lr=3.4486e-05) (hash(x)=25836453) +7871 train 6.442212 (lr=3.4471e-05) (hash(x)=22700785) +7872 train 6.582932 (lr=3.4456e-05) (hash(x)=23088949) +7873 train 6.434143 (lr=3.4440e-05) (hash(x)=22802001) +7874 train 6.451859 (lr=3.4425e-05) (hash(x)=23064276) +7875 train 6.646222 (lr=3.4410e-05) (hash(x)=24096486) +7876 train 7.115904 (lr=3.4394e-05) (hash(x)=25740010) +7877 train 6.581229 (lr=3.4379e-05) (hash(x)=24578737) +7878 train 7.242606 (lr=3.4364e-05) (hash(x)=26850665) +7879 train 7.505863 (lr=3.4348e-05) (hash(x)=29611280) +7880 train 7.501423 (lr=3.4333e-05) (hash(x)=29470261) +7881 train 7.756194 (lr=3.4318e-05) (hash(x)=30218145) +7882 train 7.273016 (lr=3.4302e-05) (hash(x)=26992212) +7883 train 6.272937 (lr=3.4287e-05) (hash(x)=22812890) +7884 train 6.553540 (lr=3.4272e-05) (hash(x)=26384382) +7885 train 6.548767 (lr=3.4257e-05) (hash(x)=25982513) +7886 train 6.481285 (lr=3.4241e-05) (hash(x)=23926560) +7887 train 6.768938 (lr=3.4226e-05) (hash(x)=25972823) +7888 train 6.494096 (lr=3.4211e-05) (hash(x)=21677567) +7889 train 6.743237 (lr=3.4196e-05) (hash(x)=24058871) +7890 train 6.432420 (lr=3.4180e-05) (hash(x)=27919563) +7891 train 6.737248 (lr=3.4165e-05) (hash(x)=24988300) +7892 train 6.519125 (lr=3.4150e-05) (hash(x)=22334999) +7893 train 6.266761 (lr=3.4135e-05) (hash(x)=21496420) +7894 train 6.908739 (lr=3.4120e-05) (hash(x)=28606185) +7895 train 6.724741 (lr=3.4104e-05) (hash(x)=23447782) +7896 train 6.508957 (lr=3.4089e-05) (hash(x)=25566724) +7897 train 6.646072 (lr=3.4074e-05) (hash(x)=25663935) +7898 train 6.341791 (lr=3.4059e-05) (hash(x)=21529073) +7899 train 6.398320 (lr=3.4044e-05) (hash(x)=22871262) +7900 val loss 6.6695 +7900 val perplexity 788.0153 +7900 train 6.773282 (lr=3.4028e-05) (hash(x)=28500664) +7901 train 6.927690 (lr=3.4013e-05) (hash(x)=27258546) +7902 train 6.455095 (lr=3.3998e-05) (hash(x)=21028657) +7903 train 6.484569 (lr=3.3983e-05) (hash(x)=22578453) +7904 train 7.041003 (lr=3.3968e-05) (hash(x)=26365380) +7905 train 6.652400 (lr=3.3953e-05) (hash(x)=25302485) +7906 train 6.338194 (lr=3.3938e-05) (hash(x)=23088848) +7907 train 6.358881 (lr=3.3922e-05) (hash(x)=22754287) +7908 train 6.583477 (lr=3.3907e-05) (hash(x)=23273793) +7909 train 6.628934 (lr=3.3892e-05) (hash(x)=24109427) +7910 train 6.497155 (lr=3.3877e-05) (hash(x)=23037062) +7911 train 6.547635 (lr=3.3862e-05) (hash(x)=25474622) +7912 train 6.396543 (lr=3.3847e-05) (hash(x)=25516547) +7913 train 6.667221 (lr=3.3832e-05) (hash(x)=25921397) +7914 train 6.467020 (lr=3.3817e-05) (hash(x)=25597193) +7915 train 6.882482 (lr=3.3802e-05) (hash(x)=28567887) +7916 train 6.509205 (lr=3.3787e-05) (hash(x)=24722602) +7917 train 6.609418 (lr=3.3772e-05) (hash(x)=25888915) +7918 train 6.844190 (lr=3.3756e-05) (hash(x)=25909185) +7919 train 6.874820 (lr=3.3741e-05) (hash(x)=22965762) +7920 train 6.682892 (lr=3.3726e-05) (hash(x)=25132952) +7921 train 6.801501 (lr=3.3711e-05) (hash(x)=26762050) +7922 train 7.026177 (lr=3.3696e-05) (hash(x)=27821861) +7923 train 6.713807 (lr=3.3681e-05) (hash(x)=27712097) +7924 train 6.585559 (lr=3.3666e-05) (hash(x)=26668077) +7925 train 6.567218 (lr=3.3651e-05) (hash(x)=23977862) +7926 train 6.361099 (lr=3.3636e-05) (hash(x)=22920065) +7927 train 6.787805 (lr=3.3621e-05) (hash(x)=26116321) +7928 train 6.518939 (lr=3.3606e-05) (hash(x)=25428823) +7929 train 6.237734 (lr=3.3591e-05) (hash(x)=19842263) +7930 train 6.512197 (lr=3.3576e-05) (hash(x)=24613587) +7931 train 6.524716 (lr=3.3561e-05) (hash(x)=24709237) +7932 train 6.549156 (lr=3.3546e-05) (hash(x)=24713381) +7933 train 6.935922 (lr=3.3531e-05) (hash(x)=26220194) +7934 train 6.598290 (lr=3.3516e-05) (hash(x)=23269354) +7935 train 6.635098 (lr=3.3501e-05) (hash(x)=25934549) +7936 train 6.758711 (lr=3.3486e-05) (hash(x)=24257703) +7937 train 6.456726 (lr=3.3472e-05) (hash(x)=24540497) +7938 train 6.299969 (lr=3.3457e-05) (hash(x)=24801019) +7939 train 6.387801 (lr=3.3442e-05) (hash(x)=21680120) +7940 train 6.655469 (lr=3.3427e-05) (hash(x)=26087218) +7941 train 6.777917 (lr=3.3412e-05) (hash(x)=22464414) +7942 train 6.310669 (lr=3.3397e-05) (hash(x)=21197341) +7943 train 6.403690 (lr=3.3382e-05) (hash(x)=23937495) +7944 train 6.527813 (lr=3.3367e-05) (hash(x)=24026983) +7945 train 6.512945 (lr=3.3352e-05) (hash(x)=21201514) +7946 train 6.708008 (lr=3.3337e-05) (hash(x)=25733970) +7947 train 6.929585 (lr=3.3322e-05) (hash(x)=25113226) +7948 train 6.932140 (lr=3.3308e-05) (hash(x)=24782532) +7949 train 6.545969 (lr=3.3293e-05) (hash(x)=20678432) +7950 val loss 6.6816 +7950 val perplexity 797.5837 +7950 train 7.015337 (lr=3.3278e-05) (hash(x)=25130552) +7951 train 6.767987 (lr=3.3263e-05) (hash(x)=26286442) +7952 train 6.622571 (lr=3.3248e-05) (hash(x)=24528398) +7953 train 6.699791 (lr=3.3233e-05) (hash(x)=25162164) +7954 train 6.841523 (lr=3.3218e-05) (hash(x)=28761564) +7955 train 7.138896 (lr=3.3204e-05) (hash(x)=30334549) +7956 train 6.931890 (lr=3.3189e-05) (hash(x)=30219445) +7957 train 6.855089 (lr=3.3174e-05) (hash(x)=30405517) +7958 train 7.032974 (lr=3.3159e-05) (hash(x)=32583015) +7959 train 7.309836 (lr=3.3144e-05) (hash(x)=32737711) +7960 train 6.242550 (lr=3.3130e-05) (hash(x)=21417014) +7961 train 6.615648 (lr=3.3115e-05) (hash(x)=25779685) +7962 train 6.272830 (lr=3.3100e-05) (hash(x)=22339899) +7963 train 6.455429 (lr=3.3085e-05) (hash(x)=23732519) +7964 train 6.747964 (lr=3.3070e-05) (hash(x)=26707754) +7965 train 7.313262 (lr=3.3056e-05) (hash(x)=29480838) +7966 train 6.566870 (lr=3.3041e-05) (hash(x)=25619433) +7967 train 6.351980 (lr=3.3026e-05) (hash(x)=20563613) +7968 train 7.117912 (lr=3.3011e-05) (hash(x)=29087294) +7969 train 6.831560 (lr=3.2997e-05) (hash(x)=25419620) +7970 train 7.015338 (lr=3.2982e-05) (hash(x)=26954882) +7971 train 6.638406 (lr=3.2967e-05) (hash(x)=21731597) +7972 train 7.057965 (lr=3.2953e-05) (hash(x)=24007512) +7973 train 6.834740 (lr=3.2938e-05) (hash(x)=26755619) +7974 train 6.637570 (lr=3.2923e-05) (hash(x)=26126126) +7975 train 6.804242 (lr=3.2908e-05) (hash(x)=26234770) +7976 train 6.662654 (lr=3.2894e-05) (hash(x)=24327571) +7977 train 6.969583 (lr=3.2879e-05) (hash(x)=23467797) +7978 train 6.537533 (lr=3.2864e-05) (hash(x)=24052543) +7979 train 6.773183 (lr=3.2850e-05) (hash(x)=25615077) +7980 train 6.517743 (lr=3.2835e-05) (hash(x)=26142937) +7981 train 6.319776 (lr=3.2820e-05) (hash(x)=23955961) +7982 train 6.973806 (lr=3.2806e-05) (hash(x)=30232295) +7983 train 6.978645 (lr=3.2791e-05) (hash(x)=26179422) +7984 train 6.643884 (lr=3.2776e-05) (hash(x)=23149315) +7985 train 6.677115 (lr=3.2762e-05) (hash(x)=25081971) +7986 train 6.576097 (lr=3.2747e-05) (hash(x)=24208764) +7987 train 6.673412 (lr=3.2732e-05) (hash(x)=23938333) +7988 train 6.810877 (lr=3.2718e-05) (hash(x)=24852787) +7989 train 6.848784 (lr=3.2703e-05) (hash(x)=27208446) +7990 train 6.594316 (lr=3.2689e-05) (hash(x)=23328362) +7991 train 6.473960 (lr=3.2674e-05) (hash(x)=23289651) +7992 train 6.865067 (lr=3.2659e-05) (hash(x)=25199368) +7993 train 6.425140 (lr=3.2645e-05) (hash(x)=21880796) +7994 train 6.603384 (lr=3.2630e-05) (hash(x)=25160607) +7995 train 7.215494 (lr=3.2616e-05) (hash(x)=28250152) +7996 train 6.700681 (lr=3.2601e-05) (hash(x)=25710921) +7997 train 7.177916 (lr=3.2586e-05) (hash(x)=28828426) +7998 train 7.523563 (lr=3.2572e-05) (hash(x)=35340474) +7999 train 7.793506 (lr=3.2557e-05) (hash(x)=36436617) +8000 val loss 6.6848 +8000 val perplexity 800.1733 +8000 train 6.767854 (lr=3.2543e-05) (hash(x)=27466943) +8001 train 6.607197 (lr=3.2528e-05) (hash(x)=23888872) +8002 train 6.673109 (lr=3.2514e-05) (hash(x)=24649009) +8003 train 6.629551 (lr=3.2499e-05) (hash(x)=24720781) +8004 train 6.485747 (lr=3.2485e-05) (hash(x)=24492728) +8005 train 6.561484 (lr=3.2470e-05) (hash(x)=23403672) +8006 train 6.497463 (lr=3.2456e-05) (hash(x)=22536483) +8007 train 6.545958 (lr=3.2441e-05) (hash(x)=24854398) +8008 train 6.893901 (lr=3.2427e-05) (hash(x)=31109356) +8009 train 6.996819 (lr=3.2412e-05) (hash(x)=32863622) +8010 train 6.702425 (lr=3.2398e-05) (hash(x)=25351172) +8011 train 6.759248 (lr=3.2383e-05) (hash(x)=22482108) +8012 train 6.701537 (lr=3.2369e-05) (hash(x)=26811154) +8013 train 6.464996 (lr=3.2354e-05) (hash(x)=22039371) +8014 train 6.731084 (lr=3.2340e-05) (hash(x)=25885230) +8015 train 6.534519 (lr=3.2325e-05) (hash(x)=25162669) +8016 train 6.420839 (lr=3.2311e-05) (hash(x)=22432142) +8017 train 6.470613 (lr=3.2296e-05) (hash(x)=21133209) +8018 train 6.565704 (lr=3.2282e-05) (hash(x)=23370074) +8019 train 6.714070 (lr=3.2268e-05) (hash(x)=24940321) +8020 train 6.772840 (lr=3.2253e-05) (hash(x)=25556156) +8021 train 6.653572 (lr=3.2239e-05) (hash(x)=25627362) +8022 train 6.269392 (lr=3.2224e-05) (hash(x)=20047713) +8023 train 6.331783 (lr=3.2210e-05) (hash(x)=20845671) +8024 train 6.800382 (lr=3.2196e-05) (hash(x)=26474806) +8025 train 6.795053 (lr=3.2181e-05) (hash(x)=26577501) +8026 train 6.889256 (lr=3.2167e-05) (hash(x)=29355336) +8027 train 6.708779 (lr=3.2152e-05) (hash(x)=24442121) +8028 train 6.645634 (lr=3.2138e-05) (hash(x)=24748974) +8029 train 6.434592 (lr=3.2124e-05) (hash(x)=21961508) +8030 train 6.625420 (lr=3.2109e-05) (hash(x)=23564979) +8031 train 6.609041 (lr=3.2095e-05) (hash(x)=23276958) +8032 train 6.655609 (lr=3.2081e-05) (hash(x)=27062020) +8033 train 6.039230 (lr=3.2066e-05) (hash(x)=18141943) +8034 train 6.412030 (lr=3.2052e-05) (hash(x)=23826340) +8035 train 6.307836 (lr=3.2038e-05) (hash(x)=20427388) +8036 train 6.739733 (lr=3.2023e-05) (hash(x)=27546226) +8037 train 6.878957 (lr=3.2009e-05) (hash(x)=25028032) +8038 train 6.438719 (lr=3.1995e-05) (hash(x)=22200513) +8039 train 6.303019 (lr=3.1980e-05) (hash(x)=22544363) +8040 train 6.492963 (lr=3.1966e-05) (hash(x)=24212094) +8041 train 6.580471 (lr=3.1952e-05) (hash(x)=24869419) +8042 train 6.548059 (lr=3.1938e-05) (hash(x)=24296836) +8043 train 6.498152 (lr=3.1923e-05) (hash(x)=26034883) +8044 train 6.771156 (lr=3.1909e-05) (hash(x)=26315167) +8045 train 6.376304 (lr=3.1895e-05) (hash(x)=24214272) +8046 train 6.573934 (lr=3.1880e-05) (hash(x)=23793866) +8047 train 6.480091 (lr=3.1866e-05) (hash(x)=22559566) +8048 train 6.702045 (lr=3.1852e-05) (hash(x)=26541218) +8049 train 6.801824 (lr=3.1838e-05) (hash(x)=21635164) +8050 val loss 6.6768 +8050 val perplexity 793.7422 +8050 train 6.401625 (lr=3.1823e-05) (hash(x)=22443760) +8051 train 6.589962 (lr=3.1809e-05) (hash(x)=25153242) +8052 train 6.687459 (lr=3.1795e-05) (hash(x)=26635351) +8053 train 6.371140 (lr=3.1781e-05) (hash(x)=23522887) +8054 train 6.608144 (lr=3.1767e-05) (hash(x)=24404717) +8055 train 6.617194 (lr=3.1752e-05) (hash(x)=24102231) +8056 train 6.715718 (lr=3.1738e-05) (hash(x)=26309006) +8057 train 6.587651 (lr=3.1724e-05) (hash(x)=23669103) +8058 train 6.620748 (lr=3.1710e-05) (hash(x)=23883924) +8059 train 6.581703 (lr=3.1696e-05) (hash(x)=24901920) +8060 train 6.882967 (lr=3.1682e-05) (hash(x)=28712869) +8061 train 6.765465 (lr=3.1667e-05) (hash(x)=26829824) +8062 train 6.691729 (lr=3.1653e-05) (hash(x)=27296346) +8063 train 6.672835 (lr=3.1639e-05) (hash(x)=26376027) +8064 train 6.466487 (lr=3.1625e-05) (hash(x)=21937626) +8065 train 6.404419 (lr=3.1611e-05) (hash(x)=25110789) +8066 train 6.812001 (lr=3.1597e-05) (hash(x)=28391608) +8067 train 7.106475 (lr=3.1583e-05) (hash(x)=27062064) +8068 train 6.997665 (lr=3.1568e-05) (hash(x)=26986091) +8069 train 6.339361 (lr=3.1554e-05) (hash(x)=22656832) +8070 train 6.525603 (lr=3.1540e-05) (hash(x)=20554057) +8071 train 6.423801 (lr=3.1526e-05) (hash(x)=22471591) +8072 train 6.628633 (lr=3.1512e-05) (hash(x)=27132488) +8073 train 6.999032 (lr=3.1498e-05) (hash(x)=29098044) +8074 train 6.351471 (lr=3.1484e-05) (hash(x)=22287166) +8075 train 6.588919 (lr=3.1470e-05) (hash(x)=23441436) +8076 train 6.498632 (lr=3.1456e-05) (hash(x)=22623734) +8077 train 6.576855 (lr=3.1442e-05) (hash(x)=25091462) +8078 train 6.537865 (lr=3.1428e-05) (hash(x)=24840167) +8079 train 6.581876 (lr=3.1414e-05) (hash(x)=25526310) +8080 train 6.675012 (lr=3.1400e-05) (hash(x)=25239622) +8081 train 6.699353 (lr=3.1385e-05) (hash(x)=25468387) +8082 train 6.355662 (lr=3.1371e-05) (hash(x)=21889264) +8083 train 6.752433 (lr=3.1357e-05) (hash(x)=24779462) +8084 train 6.694923 (lr=3.1343e-05) (hash(x)=25544643) +8085 train 6.456937 (lr=3.1329e-05) (hash(x)=25278229) +8086 train 6.511435 (lr=3.1315e-05) (hash(x)=23887373) +8087 train 6.680747 (lr=3.1301e-05) (hash(x)=25749229) +8088 train 6.748172 (lr=3.1287e-05) (hash(x)=27224436) +8089 train 6.572643 (lr=3.1273e-05) (hash(x)=25938623) +8090 train 6.704053 (lr=3.1259e-05) (hash(x)=28535936) +8091 train 6.912878 (lr=3.1245e-05) (hash(x)=27410703) +8092 train 6.976724 (lr=3.1232e-05) (hash(x)=27487669) +8093 train 6.563428 (lr=3.1218e-05) (hash(x)=23944021) +8094 train 6.581525 (lr=3.1204e-05) (hash(x)=24078812) +8095 train 6.622192 (lr=3.1190e-05) (hash(x)=26163080) +8096 train 6.566797 (lr=3.1176e-05) (hash(x)=25628371) +8097 train 6.715875 (lr=3.1162e-05) (hash(x)=25650588) +8098 train 6.982234 (lr=3.1148e-05) (hash(x)=28255316) +8099 train 6.559495 (lr=3.1134e-05) (hash(x)=26163104) +8100 val loss 6.6666 +8100 val perplexity 785.6992 +8100 train 6.923132 (lr=3.1120e-05) (hash(x)=27937451) +8101 train 6.687499 (lr=3.1106e-05) (hash(x)=27568757) +8102 train 6.228965 (lr=3.1092e-05) (hash(x)=20920095) +8103 train 6.657777 (lr=3.1078e-05) (hash(x)=25983824) +8104 train 6.667263 (lr=3.1064e-05) (hash(x)=23654026) +8105 train 6.490704 (lr=3.1051e-05) (hash(x)=21663626) +8106 train 6.511171 (lr=3.1037e-05) (hash(x)=24913817) +8107 train 6.573724 (lr=3.1023e-05) (hash(x)=24363656) +8108 train 6.354289 (lr=3.1009e-05) (hash(x)=22855954) +8109 train 6.356257 (lr=3.0995e-05) (hash(x)=22503583) +8110 train 6.673878 (lr=3.0981e-05) (hash(x)=25920535) +8111 train 6.506651 (lr=3.0967e-05) (hash(x)=22782927) +8112 train 6.690049 (lr=3.0954e-05) (hash(x)=23038752) +8113 train 6.579005 (lr=3.0940e-05) (hash(x)=25997900) +8114 train 7.133235 (lr=3.0926e-05) (hash(x)=25080127) +8115 train 6.566104 (lr=3.0912e-05) (hash(x)=21280677) +8116 train 6.542530 (lr=3.0898e-05) (hash(x)=23341605) +8117 train 6.318773 (lr=3.0885e-05) (hash(x)=22449510) +8118 train 6.581766 (lr=3.0871e-05) (hash(x)=21772566) +8119 train 7.160965 (lr=3.0857e-05) (hash(x)=27342614) +8120 train 6.722047 (lr=3.0843e-05) (hash(x)=24786142) +8121 train 6.582935 (lr=3.0829e-05) (hash(x)=24698672) +8122 train 6.696206 (lr=3.0816e-05) (hash(x)=23657694) +8123 train 6.807714 (lr=3.0802e-05) (hash(x)=24784010) +8124 train 6.596427 (lr=3.0788e-05) (hash(x)=22472621) +8125 train 6.624838 (lr=3.0774e-05) (hash(x)=23201473) +8126 train 6.602440 (lr=3.0761e-05) (hash(x)=24327447) +8127 train 7.073522 (lr=3.0747e-05) (hash(x)=31792461) +8128 train 6.512752 (lr=3.0733e-05) (hash(x)=25062312) +8129 train 6.688289 (lr=3.0719e-05) (hash(x)=25303707) +8130 train 7.078277 (lr=3.0706e-05) (hash(x)=29510116) +8131 train 7.553618 (lr=3.0692e-05) (hash(x)=32012132) +8132 train 6.207656 (lr=3.0678e-05) (hash(x)=19687320) +8133 train 6.757926 (lr=3.0665e-05) (hash(x)=28948253) +8134 train 6.806688 (lr=3.0651e-05) (hash(x)=26468684) +8135 train 6.434772 (lr=3.0637e-05) (hash(x)=24579444) +8136 train 6.727848 (lr=3.0624e-05) (hash(x)=25073940) +8137 train 6.257980 (lr=3.0610e-05) (hash(x)=22379856) +8138 train 6.487827 (lr=3.0596e-05) (hash(x)=25780978) +8139 train 6.463362 (lr=3.0583e-05) (hash(x)=24219393) +8140 train 6.912344 (lr=3.0569e-05) (hash(x)=25762719) +8141 train 6.645679 (lr=3.0555e-05) (hash(x)=24065309) +8142 train 6.497585 (lr=3.0542e-05) (hash(x)=22954824) +8143 train 6.592496 (lr=3.0528e-05) (hash(x)=26027784) +8144 train 6.821402 (lr=3.0514e-05) (hash(x)=24905633) +8145 train 6.562718 (lr=3.0501e-05) (hash(x)=25977319) +8146 train 6.343000 (lr=3.0487e-05) (hash(x)=21779245) +8147 train 6.581078 (lr=3.0473e-05) (hash(x)=24563059) +8148 train 6.579755 (lr=3.0460e-05) (hash(x)=24088662) +8149 train 6.587022 (lr=3.0446e-05) (hash(x)=23679988) +8150 val loss 6.6666 +8150 val perplexity 785.6895 +8150 train 6.342138 (lr=3.0433e-05) (hash(x)=22401244) +8151 train 6.516125 (lr=3.0419e-05) (hash(x)=23796407) +8152 train 6.537857 (lr=3.0406e-05) (hash(x)=22505873) +8153 train 6.536806 (lr=3.0392e-05) (hash(x)=22843653) +8154 train 6.926820 (lr=3.0378e-05) (hash(x)=25111799) +8155 train 6.477293 (lr=3.0365e-05) (hash(x)=24465024) +8156 train 6.485335 (lr=3.0351e-05) (hash(x)=24935841) +8157 train 6.360046 (lr=3.0338e-05) (hash(x)=21805049) +8158 train 6.598434 (lr=3.0324e-05) (hash(x)=24835421) +8159 train 6.623868 (lr=3.0311e-05) (hash(x)=25098715) +8160 train 6.776651 (lr=3.0297e-05) (hash(x)=28489841) +8161 train 6.657532 (lr=3.0284e-05) (hash(x)=23686798) +8162 train 6.570779 (lr=3.0270e-05) (hash(x)=23939462) +8163 train 6.502289 (lr=3.0257e-05) (hash(x)=23492430) +8164 train 6.379208 (lr=3.0243e-05) (hash(x)=22740065) +8165 train 6.415912 (lr=3.0230e-05) (hash(x)=23660827) +8166 train 6.432827 (lr=3.0216e-05) (hash(x)=21626652) +8167 train 6.633473 (lr=3.0203e-05) (hash(x)=25277692) +8168 train 6.520145 (lr=3.0189e-05) (hash(x)=27042991) +8169 train 6.618991 (lr=3.0176e-05) (hash(x)=25977302) +8170 train 6.456417 (lr=3.0162e-05) (hash(x)=22519601) +8171 train 6.495955 (lr=3.0149e-05) (hash(x)=24546014) +8172 train 6.453663 (lr=3.0135e-05) (hash(x)=24240593) +8173 train 6.450372 (lr=3.0122e-05) (hash(x)=23927922) +8174 train 6.581815 (lr=3.0109e-05) (hash(x)=25967897) +8175 train 6.385902 (lr=3.0095e-05) (hash(x)=20733689) +8176 train 6.636992 (lr=3.0082e-05) (hash(x)=23347111) +8177 train 6.575161 (lr=3.0068e-05) (hash(x)=23237687) +8178 train 6.396792 (lr=3.0055e-05) (hash(x)=21188182) +8179 train 6.705589 (lr=3.0041e-05) (hash(x)=24203337) +8180 train 6.755925 (lr=3.0028e-05) (hash(x)=27929945) +8181 train 6.460435 (lr=3.0015e-05) (hash(x)=22511355) +8182 train 6.536844 (lr=3.0001e-05) (hash(x)=20977032) +8183 train 6.380893 (lr=2.9988e-05) (hash(x)=21858565) +8184 train 6.369100 (lr=2.9975e-05) (hash(x)=21213479) +8185 train 6.721146 (lr=2.9961e-05) (hash(x)=25946762) +8186 train 6.303322 (lr=2.9948e-05) (hash(x)=21009008) +8187 train 5.872566 (lr=2.9934e-05) (hash(x)=18440304) +8188 train 6.426782 (lr=2.9921e-05) (hash(x)=22505915) +8189 train 6.734174 (lr=2.9908e-05) (hash(x)=27890065) +8190 train 6.592868 (lr=2.9894e-05) (hash(x)=25534240) +8191 train 6.617149 (lr=2.9881e-05) (hash(x)=25012219) +8192 train 6.610683 (lr=2.9868e-05) (hash(x)=22834991) +8193 train 6.378580 (lr=2.9855e-05) (hash(x)=23731919) +8194 train 6.605856 (lr=2.9841e-05) (hash(x)=23273004) +8195 train 6.615141 (lr=2.9828e-05) (hash(x)=24082398) +8196 train 6.562256 (lr=2.9815e-05) (hash(x)=23867180) +8197 train 6.540926 (lr=2.9801e-05) (hash(x)=25816243) +8198 train 6.998346 (lr=2.9788e-05) (hash(x)=27595078) +8199 train 6.836653 (lr=2.9775e-05) (hash(x)=25365357) +8200 val loss 6.6712 +8200 val perplexity 789.3639 +8200 train 6.592293 (lr=2.9762e-05) (hash(x)=21346912) +8201 train 6.557256 (lr=2.9748e-05) (hash(x)=22754363) +8202 train 6.630695 (lr=2.9735e-05) (hash(x)=23830033) +8203 train 6.362316 (lr=2.9722e-05) (hash(x)=23424625) +8204 train 6.734236 (lr=2.9709e-05) (hash(x)=25906746) +8205 train 6.521849 (lr=2.9695e-05) (hash(x)=24250485) +8206 train 6.640211 (lr=2.9682e-05) (hash(x)=26523143) +8207 train 6.595953 (lr=2.9669e-05) (hash(x)=22952042) +8208 train 6.525026 (lr=2.9656e-05) (hash(x)=23337243) +8209 train 6.538651 (lr=2.9642e-05) (hash(x)=25742281) +8210 train 6.398237 (lr=2.9629e-05) (hash(x)=25326781) +8211 train 6.460918 (lr=2.9616e-05) (hash(x)=25054382) +8212 train 6.868692 (lr=2.9603e-05) (hash(x)=24694024) +8213 train 6.941994 (lr=2.9590e-05) (hash(x)=27346323) +8214 train 6.845313 (lr=2.9577e-05) (hash(x)=25237882) +8215 train 6.561362 (lr=2.9563e-05) (hash(x)=23755293) +8216 train 6.577775 (lr=2.9550e-05) (hash(x)=27793110) +8217 train 6.439731 (lr=2.9537e-05) (hash(x)=23471296) +8218 train 6.697569 (lr=2.9524e-05) (hash(x)=28166465) +8219 train 6.596317 (lr=2.9511e-05) (hash(x)=25792926) +8220 train 6.552085 (lr=2.9498e-05) (hash(x)=24091621) +8221 train 6.737006 (lr=2.9485e-05) (hash(x)=24484961) +8222 train 6.992888 (lr=2.9471e-05) (hash(x)=28198266) +8223 train 6.400650 (lr=2.9458e-05) (hash(x)=23549853) +8224 train 6.625433 (lr=2.9445e-05) (hash(x)=24638112) +8225 train 6.708868 (lr=2.9432e-05) (hash(x)=26199638) +8226 train 6.291754 (lr=2.9419e-05) (hash(x)=22105141) +8227 train 6.448370 (lr=2.9406e-05) (hash(x)=23260060) +8228 train 6.397312 (lr=2.9393e-05) (hash(x)=21622199) +8229 train 6.845526 (lr=2.9380e-05) (hash(x)=26379145) +8230 train 6.843900 (lr=2.9367e-05) (hash(x)=25424224) +8231 train 7.524856 (lr=2.9354e-05) (hash(x)=28187393) +8232 train 6.400561 (lr=2.9341e-05) (hash(x)=22219046) +8233 train 6.644012 (lr=2.9328e-05) (hash(x)=22394746) +8234 train 6.562096 (lr=2.9315e-05) (hash(x)=25076456) +8235 train 6.703789 (lr=2.9302e-05) (hash(x)=26535767) +8236 train 6.689594 (lr=2.9289e-05) (hash(x)=25114535) +8237 train 6.352548 (lr=2.9275e-05) (hash(x)=22614475) +8238 train 6.579559 (lr=2.9262e-05) (hash(x)=23461867) +8239 train 6.691078 (lr=2.9249e-05) (hash(x)=24001909) +8240 train 6.613570 (lr=2.9236e-05) (hash(x)=28387107) +8241 train 6.804121 (lr=2.9223e-05) (hash(x)=28069697) +8242 train 6.765247 (lr=2.9210e-05) (hash(x)=26760782) +8243 train 6.497682 (lr=2.9198e-05) (hash(x)=24772352) +8244 train 6.973305 (lr=2.9185e-05) (hash(x)=28819231) +8245 train 6.965797 (lr=2.9172e-05) (hash(x)=28547203) +8246 train 6.546841 (lr=2.9159e-05) (hash(x)=25505094) +8247 train 6.536661 (lr=2.9146e-05) (hash(x)=24662903) +8248 train 6.509041 (lr=2.9133e-05) (hash(x)=22725063) +8249 train 6.176909 (lr=2.9120e-05) (hash(x)=20160775) +8250 val loss 6.6595 +8250 val perplexity 780.1613 +8250 train 6.627576 (lr=2.9107e-05) (hash(x)=25631966) +8251 train 6.610925 (lr=2.9094e-05) (hash(x)=27264395) +8252 train 6.714864 (lr=2.9081e-05) (hash(x)=22258278) +8253 train 6.511690 (lr=2.9068e-05) (hash(x)=25479509) +8254 train 6.450778 (lr=2.9055e-05) (hash(x)=25604021) +8255 train 6.805446 (lr=2.9042e-05) (hash(x)=25011798) +8256 train 6.291698 (lr=2.9029e-05) (hash(x)=20395692) +8257 train 6.564186 (lr=2.9017e-05) (hash(x)=25744518) +8258 train 6.434360 (lr=2.9004e-05) (hash(x)=24128628) +8259 train 6.490831 (lr=2.8991e-05) (hash(x)=25339108) +8260 train 6.396846 (lr=2.8978e-05) (hash(x)=25598405) +8261 train 6.632276 (lr=2.8965e-05) (hash(x)=24595675) +8262 train 6.529489 (lr=2.8952e-05) (hash(x)=23597125) +8263 train 6.318368 (lr=2.8939e-05) (hash(x)=22266963) +8264 train 6.586546 (lr=2.8926e-05) (hash(x)=24201854) +8265 train 6.675946 (lr=2.8914e-05) (hash(x)=23513916) +8266 train 6.095990 (lr=2.8901e-05) (hash(x)=19253843) +8267 train 6.385145 (lr=2.8888e-05) (hash(x)=24723976) +8268 train 6.602170 (lr=2.8875e-05) (hash(x)=24353316) +8269 train 6.458056 (lr=2.8862e-05) (hash(x)=23260347) +8270 train 6.563020 (lr=2.8850e-05) (hash(x)=26082739) +8271 train 6.869086 (lr=2.8837e-05) (hash(x)=28052131) +8272 train 6.594038 (lr=2.8824e-05) (hash(x)=25789986) +8273 train 6.703381 (lr=2.8811e-05) (hash(x)=24039711) +8274 train 6.440059 (lr=2.8798e-05) (hash(x)=22283411) +8275 train 6.576683 (lr=2.8786e-05) (hash(x)=23848221) +8276 train 6.882077 (lr=2.8773e-05) (hash(x)=25946640) +8277 train 6.664137 (lr=2.8760e-05) (hash(x)=24747105) +8278 train 6.711757 (lr=2.8747e-05) (hash(x)=26711267) +8279 train 6.735974 (lr=2.8735e-05) (hash(x)=27364904) +8280 train 6.894008 (lr=2.8722e-05) (hash(x)=28656982) +8281 train 6.329307 (lr=2.8709e-05) (hash(x)=23060568) +8282 train 6.523052 (lr=2.8697e-05) (hash(x)=24516125) +8283 train 6.616098 (lr=2.8684e-05) (hash(x)=25030412) +8284 train 6.504942 (lr=2.8671e-05) (hash(x)=25225968) +8285 train 6.508998 (lr=2.8658e-05) (hash(x)=22462143) +8286 train 6.497575 (lr=2.8646e-05) (hash(x)=22405463) +8287 train 6.769415 (lr=2.8633e-05) (hash(x)=25527764) +8288 train 6.610951 (lr=2.8620e-05) (hash(x)=24318321) +8289 train 6.514283 (lr=2.8608e-05) (hash(x)=24917732) +8290 train 6.659062 (lr=2.8595e-05) (hash(x)=24457805) +8291 train 7.206951 (lr=2.8582e-05) (hash(x)=26607434) +8292 train 6.712535 (lr=2.8570e-05) (hash(x)=25000944) +8293 train 6.523068 (lr=2.8557e-05) (hash(x)=23805495) +8294 train 6.398876 (lr=2.8544e-05) (hash(x)=21822450) +8295 train 7.328693 (lr=2.8532e-05) (hash(x)=31557726) +8296 train 6.761353 (lr=2.8519e-05) (hash(x)=26154948) +8297 train 6.464839 (lr=2.8507e-05) (hash(x)=24792046) +8298 train 6.727501 (lr=2.8494e-05) (hash(x)=28517844) +8299 train 6.919233 (lr=2.8481e-05) (hash(x)=27110417) +8300 val loss 6.6613 +8300 val perplexity 781.5695 +8300 train 6.646713 (lr=2.8469e-05) (hash(x)=21934946) +8301 train 6.557221 (lr=2.8456e-05) (hash(x)=23812638) +8302 train 6.601001 (lr=2.8444e-05) (hash(x)=23977615) +8303 train 6.470340 (lr=2.8431e-05) (hash(x)=23822119) +8304 train 6.388351 (lr=2.8418e-05) (hash(x)=21308892) +8305 train 6.457679 (lr=2.8406e-05) (hash(x)=23288684) +8306 train 6.377380 (lr=2.8393e-05) (hash(x)=23010605) +8307 train 6.266597 (lr=2.8381e-05) (hash(x)=22477165) +8308 train 6.521773 (lr=2.8368e-05) (hash(x)=24735163) +8309 train 6.812726 (lr=2.8356e-05) (hash(x)=30211681) +8310 train 6.715324 (lr=2.8343e-05) (hash(x)=28503702) +8311 train 6.133429 (lr=2.8331e-05) (hash(x)=21026034) +8312 train 6.655684 (lr=2.8318e-05) (hash(x)=26392924) +8313 train 6.489585 (lr=2.8306e-05) (hash(x)=25237015) +8314 train 6.325330 (lr=2.8293e-05) (hash(x)=22630508) +8315 train 6.440166 (lr=2.8281e-05) (hash(x)=23084445) +8316 train 6.314354 (lr=2.8268e-05) (hash(x)=22927381) +8317 train 6.457471 (lr=2.8256e-05) (hash(x)=23550270) +8318 train 6.501822 (lr=2.8243e-05) (hash(x)=23190549) +8319 train 6.665445 (lr=2.8231e-05) (hash(x)=25878395) +8320 train 6.501265 (lr=2.8218e-05) (hash(x)=23034017) +8321 train 6.619354 (lr=2.8206e-05) (hash(x)=25142805) +8322 train 6.623888 (lr=2.8193e-05) (hash(x)=26964763) +8323 train 6.460438 (lr=2.8181e-05) (hash(x)=25928298) +8324 train 7.189929 (lr=2.8168e-05) (hash(x)=31223146) +8325 train 6.688962 (lr=2.8156e-05) (hash(x)=24304343) +8326 train 6.548317 (lr=2.8143e-05) (hash(x)=25312035) +8327 train 6.338726 (lr=2.8131e-05) (hash(x)=22911010) +8328 train 6.446968 (lr=2.8119e-05) (hash(x)=23266004) +8329 train 6.515010 (lr=2.8106e-05) (hash(x)=23593283) +8330 train 6.786943 (lr=2.8094e-05) (hash(x)=27685415) +8331 train 6.535900 (lr=2.8081e-05) (hash(x)=22504637) +8332 train 6.445827 (lr=2.8069e-05) (hash(x)=24028185) +8333 train 6.526111 (lr=2.8057e-05) (hash(x)=23896829) +8334 train 6.463027 (lr=2.8044e-05) (hash(x)=22078577) +8335 train 6.704401 (lr=2.8032e-05) (hash(x)=26993263) +8336 train 7.045439 (lr=2.8020e-05) (hash(x)=27200675) +8337 train 6.926333 (lr=2.8007e-05) (hash(x)=30806534) +8338 train 6.708284 (lr=2.7995e-05) (hash(x)=27336326) +8339 train 6.456728 (lr=2.7983e-05) (hash(x)=23411126) +8340 train 6.714161 (lr=2.7970e-05) (hash(x)=28583293) +8341 train 6.439204 (lr=2.7958e-05) (hash(x)=24251549) +8342 train 6.171843 (lr=2.7946e-05) (hash(x)=18244404) +8343 train 6.647587 (lr=2.7933e-05) (hash(x)=23899619) +8344 train 6.313694 (lr=2.7921e-05) (hash(x)=20335423) +8345 train 6.326752 (lr=2.7909e-05) (hash(x)=24298532) +8346 train 6.556808 (lr=2.7896e-05) (hash(x)=26879476) +8347 train 6.723699 (lr=2.7884e-05) (hash(x)=25643027) +8348 train 6.544387 (lr=2.7872e-05) (hash(x)=20576510) +8349 train 6.413881 (lr=2.7860e-05) (hash(x)=21440632) +8350 val loss 6.6556 +8350 val perplexity 777.1033 +8350 train 6.838248 (lr=2.7847e-05) (hash(x)=25092353) +8351 train 6.470937 (lr=2.7835e-05) (hash(x)=23119758) +8352 train 6.664471 (lr=2.7823e-05) (hash(x)=26462012) +8353 train 7.107707 (lr=2.7811e-05) (hash(x)=25213587) +8354 train 6.631332 (lr=2.7798e-05) (hash(x)=23553353) +8355 train 6.358099 (lr=2.7786e-05) (hash(x)=22277032) +8356 train 6.683363 (lr=2.7774e-05) (hash(x)=24095797) +8357 train 6.604216 (lr=2.7762e-05) (hash(x)=23148627) +8358 train 6.847873 (lr=2.7749e-05) (hash(x)=26443044) +8359 train 7.412799 (lr=2.7737e-05) (hash(x)=30897645) +8360 train 7.058556 (lr=2.7725e-05) (hash(x)=31696114) +8361 train 6.475488 (lr=2.7713e-05) (hash(x)=21977825) +8362 train 6.831491 (lr=2.7701e-05) (hash(x)=28815816) +8363 train 6.059327 (lr=2.7688e-05) (hash(x)=20997528) +8364 train 6.546253 (lr=2.7676e-05) (hash(x)=25069615) +8365 train 6.354431 (lr=2.7664e-05) (hash(x)=19751176) +8366 train 6.670624 (lr=2.7652e-05) (hash(x)=23715168) +8367 train 6.781461 (lr=2.7640e-05) (hash(x)=24425875) +8368 train 6.975386 (lr=2.7628e-05) (hash(x)=28659611) +8369 train 6.799627 (lr=2.7616e-05) (hash(x)=22684492) +8370 train 6.303596 (lr=2.7603e-05) (hash(x)=23042845) +8371 train 6.385362 (lr=2.7591e-05) (hash(x)=24089962) +8372 train 6.619290 (lr=2.7579e-05) (hash(x)=26590848) +8373 train 6.493112 (lr=2.7567e-05) (hash(x)=22821539) +8374 train 6.652120 (lr=2.7555e-05) (hash(x)=24622128) +8375 train 6.772623 (lr=2.7543e-05) (hash(x)=28253341) +8376 train 6.859428 (lr=2.7531e-05) (hash(x)=25624195) +8377 train 6.781207 (lr=2.7519e-05) (hash(x)=24483642) +8378 train 6.742980 (lr=2.7507e-05) (hash(x)=25929373) +8379 train 6.753659 (lr=2.7495e-05) (hash(x)=25382746) +8380 train 6.779747 (lr=2.7483e-05) (hash(x)=25870450) +8381 train 6.687415 (lr=2.7470e-05) (hash(x)=25475873) +8382 train 6.609729 (lr=2.7458e-05) (hash(x)=24874844) +8383 train 6.578297 (lr=2.7446e-05) (hash(x)=23403513) +8384 train 6.494123 (lr=2.7434e-05) (hash(x)=24215021) +8385 train 6.894025 (lr=2.7422e-05) (hash(x)=28701704) +8386 train 6.968522 (lr=2.7410e-05) (hash(x)=26100061) +8387 train 6.603336 (lr=2.7398e-05) (hash(x)=24574442) +8388 train 6.477196 (lr=2.7386e-05) (hash(x)=22036566) +8389 train 7.177902 (lr=2.7374e-05) (hash(x)=28759403) +8390 train 6.919022 (lr=2.7362e-05) (hash(x)=30085356) +8391 train 6.469392 (lr=2.7350e-05) (hash(x)=24994995) +8392 train 6.402745 (lr=2.7338e-05) (hash(x)=19906687) +8393 train 6.317256 (lr=2.7326e-05) (hash(x)=23060032) +8394 train 6.594983 (lr=2.7314e-05) (hash(x)=25962418) +8395 train 7.016739 (lr=2.7302e-05) (hash(x)=26721799) +8396 train 6.920803 (lr=2.7290e-05) (hash(x)=28975605) +8397 train 7.068884 (lr=2.7279e-05) (hash(x)=30706190) +8398 train 7.002352 (lr=2.7267e-05) (hash(x)=25211102) +8399 train 6.742378 (lr=2.7255e-05) (hash(x)=24751625) +8400 val loss 6.6548 +8400 val perplexity 776.5004 +8400 train 6.573701 (lr=2.7243e-05) (hash(x)=24434524) +8401 train 6.566652 (lr=2.7231e-05) (hash(x)=27731310) +8402 train 6.707503 (lr=2.7219e-05) (hash(x)=26501288) +8403 train 6.994941 (lr=2.7207e-05) (hash(x)=25708316) +8404 train 6.767248 (lr=2.7195e-05) (hash(x)=22687989) +8405 train 6.504352 (lr=2.7183e-05) (hash(x)=22854783) +8406 train 6.350369 (lr=2.7171e-05) (hash(x)=21590282) +8407 train 6.442666 (lr=2.7159e-05) (hash(x)=24569689) +8408 train 6.338511 (lr=2.7148e-05) (hash(x)=19752026) +8409 train 6.482048 (lr=2.7136e-05) (hash(x)=21289331) +8410 train 6.385931 (lr=2.7124e-05) (hash(x)=20353064) +8411 train 6.356912 (lr=2.7112e-05) (hash(x)=20503047) +8412 train 6.516477 (lr=2.7100e-05) (hash(x)=21790400) +8413 train 6.491296 (lr=2.7088e-05) (hash(x)=23395376) +8414 train 6.649718 (lr=2.7077e-05) (hash(x)=26791536) +8415 train 6.751626 (lr=2.7065e-05) (hash(x)=25589724) +8416 train 6.627080 (lr=2.7053e-05) (hash(x)=27617543) +8417 train 6.446381 (lr=2.7041e-05) (hash(x)=23229539) +8418 train 6.613989 (lr=2.7029e-05) (hash(x)=24605106) +8419 train 6.493671 (lr=2.7017e-05) (hash(x)=22717216) +8420 train 6.493138 (lr=2.7006e-05) (hash(x)=26681572) +8421 train 6.536222 (lr=2.6994e-05) (hash(x)=24375489) +8422 train 6.593616 (lr=2.6982e-05) (hash(x)=25653545) +8423 train 6.564186 (lr=2.6970e-05) (hash(x)=26240309) +8424 train 6.308874 (lr=2.6959e-05) (hash(x)=22182386) +8425 train 6.628876 (lr=2.6947e-05) (hash(x)=25835592) +8426 train 6.554358 (lr=2.6935e-05) (hash(x)=25878086) +8427 train 6.447198 (lr=2.6923e-05) (hash(x)=20674151) +8428 train 6.332193 (lr=2.6912e-05) (hash(x)=22842685) +8429 train 6.939484 (lr=2.6900e-05) (hash(x)=29588582) +8430 train 7.009485 (lr=2.6888e-05) (hash(x)=28769377) +8431 train 6.663404 (lr=2.6876e-05) (hash(x)=27287150) +8432 train 6.373862 (lr=2.6865e-05) (hash(x)=25686898) +8433 train 6.570323 (lr=2.6853e-05) (hash(x)=24594186) +8434 train 6.572982 (lr=2.6841e-05) (hash(x)=23406267) +8435 train 6.746822 (lr=2.6830e-05) (hash(x)=26302259) +8436 train 7.250912 (lr=2.6818e-05) (hash(x)=34623663) +8437 train 6.419750 (lr=2.6806e-05) (hash(x)=22937308) +8438 train 6.543347 (lr=2.6795e-05) (hash(x)=22313264) +8439 train 6.400525 (lr=2.6783e-05) (hash(x)=21620160) +8440 train 6.633910 (lr=2.6771e-05) (hash(x)=23851680) +8441 train 6.761636 (lr=2.6760e-05) (hash(x)=25884337) +8442 train 6.581975 (lr=2.6748e-05) (hash(x)=22828831) +8443 train 6.440354 (lr=2.6736e-05) (hash(x)=19948407) +8444 train 6.574804 (lr=2.6725e-05) (hash(x)=24318773) +8445 train 6.517028 (lr=2.6713e-05) (hash(x)=25199121) +8446 train 6.796382 (lr=2.6702e-05) (hash(x)=27461132) +8447 train 6.549844 (lr=2.6690e-05) (hash(x)=25909048) +8448 train 6.613222 (lr=2.6678e-05) (hash(x)=25990097) +8449 train 6.363852 (lr=2.6667e-05) (hash(x)=20171092) +8450 val loss 6.6556 +8450 val perplexity 777.0956 +8450 train 6.736757 (lr=2.6655e-05) (hash(x)=25768461) +8451 train 6.520074 (lr=2.6644e-05) (hash(x)=26199182) +8452 train 6.351804 (lr=2.6632e-05) (hash(x)=23081914) +8453 train 7.501858 (lr=2.6621e-05) (hash(x)=28968813) +8454 train 6.447733 (lr=2.6609e-05) (hash(x)=23441977) +8455 train 6.563770 (lr=2.6597e-05) (hash(x)=24988924) +8456 train 6.504530 (lr=2.6586e-05) (hash(x)=24979485) +8457 train 6.700326 (lr=2.6574e-05) (hash(x)=26987620) +8458 train 6.629246 (lr=2.6563e-05) (hash(x)=24240216) +8459 train 6.576406 (lr=2.6551e-05) (hash(x)=24051167) +8460 train 6.681108 (lr=2.6540e-05) (hash(x)=24378218) +8461 train 6.628428 (lr=2.6528e-05) (hash(x)=24225864) +8462 train 6.455512 (lr=2.6517e-05) (hash(x)=25463499) +8463 train 6.250111 (lr=2.6505e-05) (hash(x)=21749184) +8464 train 6.556272 (lr=2.6494e-05) (hash(x)=25495460) +8465 train 6.434172 (lr=2.6482e-05) (hash(x)=21242537) +8466 train 6.739777 (lr=2.6471e-05) (hash(x)=26434292) +8467 train 6.552876 (lr=2.6459e-05) (hash(x)=24959243) +8468 train 6.168038 (lr=2.6448e-05) (hash(x)=23308776) +8469 train 6.594431 (lr=2.6436e-05) (hash(x)=25457559) +8470 train 6.635425 (lr=2.6425e-05) (hash(x)=24783385) +8471 train 6.636738 (lr=2.6414e-05) (hash(x)=28016509) +8472 train 6.841541 (lr=2.6402e-05) (hash(x)=23057905) +8473 train 6.433637 (lr=2.6391e-05) (hash(x)=26972689) +8474 train 6.355667 (lr=2.6379e-05) (hash(x)=21658886) +8475 train 6.435945 (lr=2.6368e-05) (hash(x)=24963855) +8476 train 6.592954 (lr=2.6357e-05) (hash(x)=26516156) +8477 train 6.640821 (lr=2.6345e-05) (hash(x)=26438819) +8478 train 6.496377 (lr=2.6334e-05) (hash(x)=22436536) +8479 train 5.934738 (lr=2.6322e-05) (hash(x)=16968685) +8480 train 6.283493 (lr=2.6311e-05) (hash(x)=22022900) +8481 train 6.709780 (lr=2.6300e-05) (hash(x)=25351350) +8482 train 6.767949 (lr=2.6288e-05) (hash(x)=27892531) +8483 train 6.737724 (lr=2.6277e-05) (hash(x)=24744756) +8484 train 6.931917 (lr=2.6266e-05) (hash(x)=25707768) +8485 train 6.178755 (lr=2.6254e-05) (hash(x)=19694178) +8486 train 6.249964 (lr=2.6243e-05) (hash(x)=21260481) +8487 train 6.446766 (lr=2.6232e-05) (hash(x)=23250948) +8488 train 6.773357 (lr=2.6220e-05) (hash(x)=26925807) +8489 train 6.686813 (lr=2.6209e-05) (hash(x)=23742260) +8490 train 6.745599 (lr=2.6198e-05) (hash(x)=24248052) +8491 train 6.325933 (lr=2.6186e-05) (hash(x)=21033881) +8492 train 6.398744 (lr=2.6175e-05) (hash(x)=21805271) +8493 train 6.683134 (lr=2.6164e-05) (hash(x)=23609357) +8494 train 6.240582 (lr=2.6152e-05) (hash(x)=21476166) +8495 train 6.735211 (lr=2.6141e-05) (hash(x)=29704860) +8496 train 6.751578 (lr=2.6130e-05) (hash(x)=28319634) +8497 train 6.648999 (lr=2.6119e-05) (hash(x)=23749636) +8498 train 6.388485 (lr=2.6107e-05) (hash(x)=22328407) +8499 train 6.436356 (lr=2.6096e-05) (hash(x)=23068363) +8500 val loss 6.6587 +8500 val perplexity 779.5250 +8500 train 6.186885 (lr=2.6085e-05) (hash(x)=20776092) +8501 train 6.272510 (lr=2.6074e-05) (hash(x)=20771670) +8502 train 6.442693 (lr=2.6062e-05) (hash(x)=23722191) +8503 train 6.494325 (lr=2.6051e-05) (hash(x)=23631523) +8504 train 6.642488 (lr=2.6040e-05) (hash(x)=27883070) +8505 train 6.839876 (lr=2.6029e-05) (hash(x)=26852519) +8506 train 7.040348 (lr=2.6018e-05) (hash(x)=31072241) +8507 train 6.424535 (lr=2.6006e-05) (hash(x)=23414648) +8508 train 6.701898 (lr=2.5995e-05) (hash(x)=23716138) +8509 train 6.548913 (lr=2.5984e-05) (hash(x)=28210484) +8510 train 6.340782 (lr=2.5973e-05) (hash(x)=22279020) +8511 train 6.311351 (lr=2.5962e-05) (hash(x)=23371548) +8512 train 6.201765 (lr=2.5951e-05) (hash(x)=22262161) +8513 train 6.827701 (lr=2.5939e-05) (hash(x)=32365249) +8514 train 6.661064 (lr=2.5928e-05) (hash(x)=26278383) +8515 train 6.767652 (lr=2.5917e-05) (hash(x)=25884825) +8516 train 6.652939 (lr=2.5906e-05) (hash(x)=25525856) +8517 train 6.671720 (lr=2.5895e-05) (hash(x)=27066161) +8518 train 6.244260 (lr=2.5884e-05) (hash(x)=23116614) +8519 train 6.361143 (lr=2.5873e-05) (hash(x)=23135296) +8520 train 6.519803 (lr=2.5862e-05) (hash(x)=26067163) +8521 train 6.606851 (lr=2.5851e-05) (hash(x)=25081364) +8522 train 6.238978 (lr=2.5839e-05) (hash(x)=22250276) +8523 train 6.538141 (lr=2.5828e-05) (hash(x)=24686637) +8524 train 6.492230 (lr=2.5817e-05) (hash(x)=25635781) +8525 train 6.210051 (lr=2.5806e-05) (hash(x)=21374749) +8526 train 6.647522 (lr=2.5795e-05) (hash(x)=30119417) +8527 train 6.362004 (lr=2.5784e-05) (hash(x)=23680607) +8528 train 6.795624 (lr=2.5773e-05) (hash(x)=26029596) +8529 train 6.731184 (lr=2.5762e-05) (hash(x)=25164153) +8530 train 6.388533 (lr=2.5751e-05) (hash(x)=23648852) +8531 train 6.388109 (lr=2.5740e-05) (hash(x)=22871659) +8532 train 6.402179 (lr=2.5729e-05) (hash(x)=24543620) +8533 train 6.270894 (lr=2.5718e-05) (hash(x)=22541829) +8534 train 6.509220 (lr=2.5707e-05) (hash(x)=27045892) +8535 train 6.517290 (lr=2.5696e-05) (hash(x)=25216320) +8536 train 6.628946 (lr=2.5685e-05) (hash(x)=22647852) +8537 train 6.794110 (lr=2.5674e-05) (hash(x)=26311404) +8538 train 6.571932 (lr=2.5663e-05) (hash(x)=22434076) +8539 train 6.628641 (lr=2.5652e-05) (hash(x)=26470755) +8540 train 6.666052 (lr=2.5641e-05) (hash(x)=25767393) +8541 train 6.635524 (lr=2.5630e-05) (hash(x)=26872581) +8542 train 6.435760 (lr=2.5619e-05) (hash(x)=24615017) +8543 train 6.602876 (lr=2.5608e-05) (hash(x)=24136535) +8544 train 6.619873 (lr=2.5597e-05) (hash(x)=22602756) +8545 train 6.543046 (lr=2.5586e-05) (hash(x)=21616327) +8546 train 6.430142 (lr=2.5576e-05) (hash(x)=27264694) +8547 train 6.949100 (lr=2.5565e-05) (hash(x)=29383906) +8548 train 7.366580 (lr=2.5554e-05) (hash(x)=31571548) +8549 train 6.908302 (lr=2.5543e-05) (hash(x)=28095903) +8550 val loss 6.6593 +8550 val perplexity 780.0273 +8550 train 6.329861 (lr=2.5532e-05) (hash(x)=20464579) +8551 train 6.386850 (lr=2.5521e-05) (hash(x)=24617268) +8552 train 6.724887 (lr=2.5510e-05) (hash(x)=25173275) +8553 train 6.508788 (lr=2.5499e-05) (hash(x)=26788479) +8554 train 6.455632 (lr=2.5488e-05) (hash(x)=23627665) +8555 train 6.665208 (lr=2.5478e-05) (hash(x)=25403205) +8556 train 6.300783 (lr=2.5467e-05) (hash(x)=21129455) +8557 train 6.570062 (lr=2.5456e-05) (hash(x)=24295823) +8558 train 6.388895 (lr=2.5445e-05) (hash(x)=22666653) +8559 train 6.507273 (lr=2.5434e-05) (hash(x)=24291572) +8560 train 6.626953 (lr=2.5423e-05) (hash(x)=23469373) +8561 train 6.361722 (lr=2.5413e-05) (hash(x)=21606938) +8562 train 6.506806 (lr=2.5402e-05) (hash(x)=23107465) +8563 train 6.603667 (lr=2.5391e-05) (hash(x)=28146936) +8564 train 6.715875 (lr=2.5380e-05) (hash(x)=28459237) +8565 train 6.846870 (lr=2.5369e-05) (hash(x)=28851234) +8566 train 6.319969 (lr=2.5359e-05) (hash(x)=23420577) +8567 train 6.582256 (lr=2.5348e-05) (hash(x)=25526717) +8568 train 6.748273 (lr=2.5337e-05) (hash(x)=27440564) +8569 train 6.557669 (lr=2.5326e-05) (hash(x)=25217943) +8570 train 6.353969 (lr=2.5316e-05) (hash(x)=25030079) +8571 train 6.330217 (lr=2.5305e-05) (hash(x)=22240570) +8572 train 6.340901 (lr=2.5294e-05) (hash(x)=20347475) +8573 train 6.501120 (lr=2.5283e-05) (hash(x)=26572462) +8574 train 6.697322 (lr=2.5273e-05) (hash(x)=26664685) +8575 train 6.788381 (lr=2.5262e-05) (hash(x)=25870938) +8576 train 6.416017 (lr=2.5251e-05) (hash(x)=22499900) +8577 train 6.583688 (lr=2.5241e-05) (hash(x)=25302109) +8578 train 6.414445 (lr=2.5230e-05) (hash(x)=23841099) +8579 train 6.204655 (lr=2.5219e-05) (hash(x)=22962888) +8580 train 6.802993 (lr=2.5208e-05) (hash(x)=25729632) +8581 train 6.136186 (lr=2.5198e-05) (hash(x)=20085773) +8582 train 6.300439 (lr=2.5187e-05) (hash(x)=21983167) +8583 train 6.301785 (lr=2.5176e-05) (hash(x)=21716336) +8584 train 6.537594 (lr=2.5166e-05) (hash(x)=24485667) +8585 train 6.376434 (lr=2.5155e-05) (hash(x)=21045672) +8586 train 6.484006 (lr=2.5145e-05) (hash(x)=24819030) +8587 train 6.643178 (lr=2.5134e-05) (hash(x)=24563963) +8588 train 6.276055 (lr=2.5123e-05) (hash(x)=21026936) +8589 train 6.828970 (lr=2.5113e-05) (hash(x)=27144130) +8590 train 6.964736 (lr=2.5102e-05) (hash(x)=28872750) +8591 train 6.536179 (lr=2.5091e-05) (hash(x)=23613060) +8592 train 6.715086 (lr=2.5081e-05) (hash(x)=29852415) +8593 train 6.736017 (lr=2.5070e-05) (hash(x)=30130128) +8594 train 6.569860 (lr=2.5060e-05) (hash(x)=24382776) +8595 train 6.676486 (lr=2.5049e-05) (hash(x)=27364688) +8596 train 6.370260 (lr=2.5039e-05) (hash(x)=23303230) +8597 train 6.337667 (lr=2.5028e-05) (hash(x)=22983508) +8598 train 6.289720 (lr=2.5017e-05) (hash(x)=23944396) +8599 train 6.311992 (lr=2.5007e-05) (hash(x)=24139659) +8600 val loss 6.6577 +8600 val perplexity 778.7589 +8600 train 6.640585 (lr=2.4996e-05) (hash(x)=27110380) +8601 train 6.560880 (lr=2.4986e-05) (hash(x)=25218666) +8602 train 6.926788 (lr=2.4975e-05) (hash(x)=26444028) +8603 train 6.977468 (lr=2.4965e-05) (hash(x)=26640743) +8604 train 6.579473 (lr=2.4954e-05) (hash(x)=25627122) +8605 train 6.567085 (lr=2.4944e-05) (hash(x)=24084098) +8606 train 6.476420 (lr=2.4933e-05) (hash(x)=23074088) +8607 train 6.404071 (lr=2.4923e-05) (hash(x)=23278075) +8608 train 6.524109 (lr=2.4912e-05) (hash(x)=24585400) +8609 train 6.806484 (lr=2.4902e-05) (hash(x)=26571053) +8610 train 6.501312 (lr=2.4891e-05) (hash(x)=24960755) +8611 train 6.288532 (lr=2.4881e-05) (hash(x)=20591951) +8612 train 6.423604 (lr=2.4870e-05) (hash(x)=25048910) +8613 train 6.606762 (lr=2.4860e-05) (hash(x)=24443041) +8614 train 6.402092 (lr=2.4850e-05) (hash(x)=23227976) +8615 train 6.163879 (lr=2.4839e-05) (hash(x)=20279799) +8616 train 6.546820 (lr=2.4829e-05) (hash(x)=25105838) +8617 train 6.589650 (lr=2.4818e-05) (hash(x)=27092069) +8618 train 6.337872 (lr=2.4808e-05) (hash(x)=22489218) +8619 train 6.345532 (lr=2.4797e-05) (hash(x)=24045703) +8620 train 6.503868 (lr=2.4787e-05) (hash(x)=24981198) +8621 train 6.530401 (lr=2.4777e-05) (hash(x)=25360189) +8622 train 6.520947 (lr=2.4766e-05) (hash(x)=23997025) +8623 train 6.552486 (lr=2.4756e-05) (hash(x)=22273288) +8624 train 6.594115 (lr=2.4746e-05) (hash(x)=20911715) +8625 train 6.601766 (lr=2.4735e-05) (hash(x)=22142901) +8626 train 7.037008 (lr=2.4725e-05) (hash(x)=26025893) +8627 train 6.549620 (lr=2.4714e-05) (hash(x)=24818246) +8628 train 7.109550 (lr=2.4704e-05) (hash(x)=29589876) +8629 train 6.385396 (lr=2.4694e-05) (hash(x)=25672352) +8630 train 6.669409 (lr=2.4683e-05) (hash(x)=24329924) +8631 train 6.260204 (lr=2.4673e-05) (hash(x)=23823738) +8632 train 6.360794 (lr=2.4663e-05) (hash(x)=21363236) +8633 train 6.534702 (lr=2.4652e-05) (hash(x)=24007341) +8634 train 7.353964 (lr=2.4642e-05) (hash(x)=29167999) +8635 train 6.890717 (lr=2.4632e-05) (hash(x)=29371345) +8636 train 6.311992 (lr=2.4622e-05) (hash(x)=24145489) +8637 train 6.692700 (lr=2.4611e-05) (hash(x)=27710420) +8638 train 6.528833 (lr=2.4601e-05) (hash(x)=22937055) +8639 train 6.481090 (lr=2.4591e-05) (hash(x)=23986451) +8640 train 6.331453 (lr=2.4581e-05) (hash(x)=24684521) +8641 train 6.864862 (lr=2.4570e-05) (hash(x)=25310095) +8642 train 6.403211 (lr=2.4560e-05) (hash(x)=22686776) +8643 train 6.920883 (lr=2.4550e-05) (hash(x)=26487840) +8644 train 6.671350 (lr=2.4540e-05) (hash(x)=25721934) +8645 train 6.278382 (lr=2.4529e-05) (hash(x)=22305036) +8646 train 6.781372 (lr=2.4519e-05) (hash(x)=25937920) +8647 train 6.285715 (lr=2.4509e-05) (hash(x)=22007606) +8648 train 6.096864 (lr=2.4499e-05) (hash(x)=25552412) +8649 train 6.745410 (lr=2.4489e-05) (hash(x)=23967063) +8650 val loss 6.6529 +8650 val perplexity 775.0185 +8650 train 6.141388 (lr=2.4478e-05) (hash(x)=21466936) +8651 train 6.320846 (lr=2.4468e-05) (hash(x)=21805011) +8652 train 6.383992 (lr=2.4458e-05) (hash(x)=24491211) +8653 train 6.581687 (lr=2.4448e-05) (hash(x)=24486636) +8654 train 6.410314 (lr=2.4438e-05) (hash(x)=23724981) +8655 train 6.211773 (lr=2.4428e-05) (hash(x)=26005846) +8656 train 6.540382 (lr=2.4417e-05) (hash(x)=26391171) +8657 train 6.151287 (lr=2.4407e-05) (hash(x)=21610448) +8658 train 6.614807 (lr=2.4397e-05) (hash(x)=24603700) +8659 train 6.475494 (lr=2.4387e-05) (hash(x)=22609993) +8660 train 6.501482 (lr=2.4377e-05) (hash(x)=23680277) +8661 train 6.446471 (lr=2.4367e-05) (hash(x)=23183024) +8662 train 6.281592 (lr=2.4357e-05) (hash(x)=21840979) +8663 train 6.384237 (lr=2.4347e-05) (hash(x)=21124146) +8664 train 6.873028 (lr=2.4337e-05) (hash(x)=28496086) +8665 train 7.084639 (lr=2.4326e-05) (hash(x)=30512535) +8666 train 6.498601 (lr=2.4316e-05) (hash(x)=23915415) +8667 train 6.805183 (lr=2.4306e-05) (hash(x)=25757491) +8668 train 6.694702 (lr=2.4296e-05) (hash(x)=25942362) +8669 train 6.584756 (lr=2.4286e-05) (hash(x)=23569736) +8670 train 6.270038 (lr=2.4276e-05) (hash(x)=20932101) +8671 train 6.585765 (lr=2.4266e-05) (hash(x)=26393576) +8672 train 6.360230 (lr=2.4256e-05) (hash(x)=23537910) +8673 train 6.286182 (lr=2.4246e-05) (hash(x)=24896330) +8674 train 6.348115 (lr=2.4236e-05) (hash(x)=24084951) +8675 train 6.771108 (lr=2.4226e-05) (hash(x)=26252028) +8676 train 6.318330 (lr=2.4216e-05) (hash(x)=21296599) +8677 train 6.774930 (lr=2.4206e-05) (hash(x)=27386936) +8678 train 6.544194 (lr=2.4196e-05) (hash(x)=23862832) +8679 train 6.539182 (lr=2.4186e-05) (hash(x)=23905543) +8680 train 6.470841 (lr=2.4176e-05) (hash(x)=22845592) +8681 train 6.519144 (lr=2.4166e-05) (hash(x)=23364632) +8682 train 6.592225 (lr=2.4156e-05) (hash(x)=25211290) +8683 train 7.693361 (lr=2.4146e-05) (hash(x)=28689501) +8684 train 6.666510 (lr=2.4136e-05) (hash(x)=25344694) +8685 train 6.561859 (lr=2.4126e-05) (hash(x)=24663231) +8686 train 6.686920 (lr=2.4116e-05) (hash(x)=27244112) +8687 train 6.923576 (lr=2.4106e-05) (hash(x)=33296423) +8688 train 6.897177 (lr=2.4097e-05) (hash(x)=26231822) +8689 train 6.740987 (lr=2.4087e-05) (hash(x)=25497517) +8690 train 6.225374 (lr=2.4077e-05) (hash(x)=21001299) +8691 train 6.586884 (lr=2.4067e-05) (hash(x)=26161975) +8692 train 6.334857 (lr=2.4057e-05) (hash(x)=23856850) +8693 train 6.584815 (lr=2.4047e-05) (hash(x)=25937843) +8694 train 6.747669 (lr=2.4037e-05) (hash(x)=26452702) +8695 train 6.563253 (lr=2.4027e-05) (hash(x)=26612719) +8696 train 6.618069 (lr=2.4017e-05) (hash(x)=26106134) +8697 train 6.517928 (lr=2.4008e-05) (hash(x)=24455131) +8698 train 6.160886 (lr=2.3998e-05) (hash(x)=19098734) +8699 train 6.424770 (lr=2.3988e-05) (hash(x)=22842285) +8700 val loss 6.6509 +8700 val perplexity 773.4446 +8700 train 6.461669 (lr=2.3978e-05) (hash(x)=26115026) +8701 train 7.050031 (lr=2.3968e-05) (hash(x)=27931313) +8702 train 6.491330 (lr=2.3958e-05) (hash(x)=24237854) +8703 train 6.752290 (lr=2.3949e-05) (hash(x)=26513425) +8704 train 6.815408 (lr=2.3939e-05) (hash(x)=27168702) +8705 train 6.475770 (lr=2.3929e-05) (hash(x)=24201459) +8706 train 6.744309 (lr=2.3919e-05) (hash(x)=26215188) +8707 train 6.280230 (lr=2.3909e-05) (hash(x)=21284018) +8708 train 6.511497 (lr=2.3900e-05) (hash(x)=25854467) +8709 train 6.380366 (lr=2.3890e-05) (hash(x)=24367707) +8710 train 6.435988 (lr=2.3880e-05) (hash(x)=24538584) +8711 train 6.695065 (lr=2.3870e-05) (hash(x)=26987888) +8712 train 6.613605 (lr=2.3861e-05) (hash(x)=23864261) +8713 train 6.480890 (lr=2.3851e-05) (hash(x)=24928818) +8714 train 6.655280 (lr=2.3841e-05) (hash(x)=24727299) +8715 train 6.330149 (lr=2.3831e-05) (hash(x)=24050563) +8716 train 6.540241 (lr=2.3822e-05) (hash(x)=26647086) +8717 train 6.641075 (lr=2.3812e-05) (hash(x)=25389890) +8718 train 6.443983 (lr=2.3802e-05) (hash(x)=22976180) +8719 train 6.232387 (lr=2.3793e-05) (hash(x)=23231269) +8720 train 6.408223 (lr=2.3783e-05) (hash(x)=23551041) +8721 train 6.387546 (lr=2.3773e-05) (hash(x)=21380877) +8722 train 6.694019 (lr=2.3764e-05) (hash(x)=26213415) +8723 train 7.064844 (lr=2.3754e-05) (hash(x)=26970987) +8724 train 7.105027 (lr=2.3744e-05) (hash(x)=25721847) +8725 train 6.642654 (lr=2.3735e-05) (hash(x)=25245269) +8726 train 7.273691 (lr=2.3725e-05) (hash(x)=31367527) +8727 train 6.599285 (lr=2.3715e-05) (hash(x)=24910068) +8728 train 6.594855 (lr=2.3706e-05) (hash(x)=25152235) +8729 train 6.587743 (lr=2.3696e-05) (hash(x)=26692459) +8730 train 6.503550 (lr=2.3686e-05) (hash(x)=25056290) +8731 train 6.134771 (lr=2.3677e-05) (hash(x)=21475124) +8732 train 6.271245 (lr=2.3667e-05) (hash(x)=20929763) +8733 train 6.267717 (lr=2.3658e-05) (hash(x)=22717431) +8734 train 6.560431 (lr=2.3648e-05) (hash(x)=27369141) +8735 train 6.402206 (lr=2.3639e-05) (hash(x)=22312912) +8736 train 6.412847 (lr=2.3629e-05) (hash(x)=24248117) +8737 train 6.668724 (lr=2.3619e-05) (hash(x)=24990050) +8738 train 6.532883 (lr=2.3610e-05) (hash(x)=25906297) +8739 train 6.446107 (lr=2.3600e-05) (hash(x)=25202491) +8740 train 6.550331 (lr=2.3591e-05) (hash(x)=25276622) +8741 train 6.522514 (lr=2.3581e-05) (hash(x)=24144633) +8742 train 6.511474 (lr=2.3572e-05) (hash(x)=24985503) +8743 train 6.786417 (lr=2.3562e-05) (hash(x)=28451492) +8744 train 6.663208 (lr=2.3553e-05) (hash(x)=25847179) +8745 train 6.499845 (lr=2.3543e-05) (hash(x)=22821810) +8746 train 6.706174 (lr=2.3534e-05) (hash(x)=26334740) +8747 train 6.628452 (lr=2.3524e-05) (hash(x)=26662729) +8748 train 6.370283 (lr=2.3515e-05) (hash(x)=26283886) +8749 train 6.357078 (lr=2.3505e-05) (hash(x)=24202447) +8750 val loss 6.6492 +8750 val perplexity 772.2028 +8750 train 6.491815 (lr=2.3496e-05) (hash(x)=24184363) +8751 train 6.176812 (lr=2.3486e-05) (hash(x)=21194753) +8752 train 7.193627 (lr=2.3477e-05) (hash(x)=25328063) +8753 train 6.777242 (lr=2.3467e-05) (hash(x)=25571299) +8754 train 6.625201 (lr=2.3458e-05) (hash(x)=25289043) +8755 train 6.561859 (lr=2.3448e-05) (hash(x)=26218321) +8756 train 6.554811 (lr=2.3439e-05) (hash(x)=24126845) +8757 train 6.335963 (lr=2.3430e-05) (hash(x)=22411026) +8758 train 6.662181 (lr=2.3420e-05) (hash(x)=24214901) +8759 train 6.459583 (lr=2.3411e-05) (hash(x)=23880312) +8760 train 6.558656 (lr=2.3401e-05) (hash(x)=26939120) +8761 train 6.315576 (lr=2.3392e-05) (hash(x)=22532092) +8762 train 6.576183 (lr=2.3383e-05) (hash(x)=24043346) +8763 train 6.527356 (lr=2.3373e-05) (hash(x)=23217194) +8764 train 6.178508 (lr=2.3364e-05) (hash(x)=22529246) +8765 train 6.663021 (lr=2.3354e-05) (hash(x)=26233330) +8766 train 6.545520 (lr=2.3345e-05) (hash(x)=26692420) +8767 train 6.545175 (lr=2.3336e-05) (hash(x)=26803143) +8768 train 6.343675 (lr=2.3326e-05) (hash(x)=21131229) +8769 train 6.397383 (lr=2.3317e-05) (hash(x)=21823248) +8770 train 6.413396 (lr=2.3308e-05) (hash(x)=25266554) +8771 train 6.654973 (lr=2.3298e-05) (hash(x)=23427249) +8772 train 6.396995 (lr=2.3289e-05) (hash(x)=24331020) +8773 train 6.504103 (lr=2.3280e-05) (hash(x)=25488580) +8774 train 6.399563 (lr=2.3270e-05) (hash(x)=24774485) +8775 train 6.420255 (lr=2.3261e-05) (hash(x)=24147822) +8776 train 6.233415 (lr=2.3252e-05) (hash(x)=20292714) +8777 train 6.114442 (lr=2.3243e-05) (hash(x)=23483022) +8778 train 6.458772 (lr=2.3233e-05) (hash(x)=21159972) +8779 train 6.421271 (lr=2.3224e-05) (hash(x)=21491600) +8780 train 6.644321 (lr=2.3215e-05) (hash(x)=26736999) +8781 train 6.289959 (lr=2.3206e-05) (hash(x)=21655173) +8782 train 6.716603 (lr=2.3196e-05) (hash(x)=24733720) +8783 train 6.306255 (lr=2.3187e-05) (hash(x)=22868399) +8784 train 6.024184 (lr=2.3178e-05) (hash(x)=18371344) +8785 train 6.261169 (lr=2.3169e-05) (hash(x)=24232955) +8786 train 6.706850 (lr=2.3159e-05) (hash(x)=27503708) +8787 train 6.526357 (lr=2.3150e-05) (hash(x)=23119732) +8788 train 6.756556 (lr=2.3141e-05) (hash(x)=25223725) +8789 train 6.771811 (lr=2.3132e-05) (hash(x)=28964917) +8790 train 6.325233 (lr=2.3123e-05) (hash(x)=23235335) +8791 train 6.393715 (lr=2.3113e-05) (hash(x)=24666868) +8792 train 6.508041 (lr=2.3104e-05) (hash(x)=24717141) +8793 train 6.405264 (lr=2.3095e-05) (hash(x)=23813669) +8794 train 6.557827 (lr=2.3086e-05) (hash(x)=23700865) +8795 train 6.431593 (lr=2.3077e-05) (hash(x)=23299873) +8796 train 6.389543 (lr=2.3068e-05) (hash(x)=22526489) +8797 train 6.904928 (lr=2.3059e-05) (hash(x)=26234265) +8798 train 6.721533 (lr=2.3049e-05) (hash(x)=28304597) +8799 train 6.756663 (lr=2.3040e-05) (hash(x)=25668453) +8800 val loss 6.6490 +8800 val perplexity 771.9874 +8800 train 6.391313 (lr=2.3031e-05) (hash(x)=21115814) +8801 train 6.330753 (lr=2.3022e-05) (hash(x)=22792643) +8802 train 6.590141 (lr=2.3013e-05) (hash(x)=26194587) +8803 train 6.667714 (lr=2.3004e-05) (hash(x)=24617431) +8804 train 6.518291 (lr=2.2995e-05) (hash(x)=23870410) +8805 train 6.980026 (lr=2.2986e-05) (hash(x)=26958453) +8806 train 6.359098 (lr=2.2977e-05) (hash(x)=23608134) +8807 train 6.892104 (lr=2.2968e-05) (hash(x)=28461208) +8808 train 6.977829 (lr=2.2959e-05) (hash(x)=28759693) +8809 train 6.495873 (lr=2.2950e-05) (hash(x)=23235698) +8810 train 6.466940 (lr=2.2940e-05) (hash(x)=24818188) +8811 train 6.442008 (lr=2.2931e-05) (hash(x)=26589581) +8812 train 6.488530 (lr=2.2922e-05) (hash(x)=23279405) +8813 train 6.563664 (lr=2.2913e-05) (hash(x)=28646133) +8814 train 6.008737 (lr=2.2904e-05) (hash(x)=19727066) +8815 train 6.384880 (lr=2.2895e-05) (hash(x)=24580038) +8816 train 6.475479 (lr=2.2886e-05) (hash(x)=22803596) +8817 train 6.400506 (lr=2.2877e-05) (hash(x)=24051767) +8818 train 6.364844 (lr=2.2868e-05) (hash(x)=23077537) +8819 train 6.472343 (lr=2.2859e-05) (hash(x)=22232039) +8820 train 6.567401 (lr=2.2850e-05) (hash(x)=26801180) +8821 train 6.846593 (lr=2.2841e-05) (hash(x)=28479353) +8822 train 6.343251 (lr=2.2833e-05) (hash(x)=21979730) +8823 train 6.411407 (lr=2.2824e-05) (hash(x)=22703857) +8824 train 6.447281 (lr=2.2815e-05) (hash(x)=23070671) +8825 train 6.412515 (lr=2.2806e-05) (hash(x)=24445973) +8826 train 6.544647 (lr=2.2797e-05) (hash(x)=23667043) +8827 train 6.349079 (lr=2.2788e-05) (hash(x)=22100323) +8828 train 6.575761 (lr=2.2779e-05) (hash(x)=22746823) +8829 train 6.620089 (lr=2.2770e-05) (hash(x)=23660633) +8830 train 6.397853 (lr=2.2761e-05) (hash(x)=22952341) +8831 train 6.714927 (lr=2.2752e-05) (hash(x)=25695897) +8832 train 6.886032 (lr=2.2743e-05) (hash(x)=25824374) +8833 train 6.484201 (lr=2.2735e-05) (hash(x)=24604080) +8834 train 6.403810 (lr=2.2726e-05) (hash(x)=22411178) +8835 train 6.290466 (lr=2.2717e-05) (hash(x)=22730308) +8836 train 6.744762 (lr=2.2708e-05) (hash(x)=28302419) +8837 train 6.716188 (lr=2.2699e-05) (hash(x)=25641174) +8838 train 6.439359 (lr=2.2690e-05) (hash(x)=22749097) +8839 train 6.332683 (lr=2.2681e-05) (hash(x)=23634054) +8840 train 6.319432 (lr=2.2673e-05) (hash(x)=19968228) +8841 train 6.526042 (lr=2.2664e-05) (hash(x)=26513268) +8842 train 6.479387 (lr=2.2655e-05) (hash(x)=24479278) +8843 train 6.808056 (lr=2.2646e-05) (hash(x)=27573268) +8844 train 6.292716 (lr=2.2637e-05) (hash(x)=24443065) +8845 train 6.515209 (lr=2.2629e-05) (hash(x)=22891103) +8846 train 6.559586 (lr=2.2620e-05) (hash(x)=24644446) +8847 train 6.554855 (lr=2.2611e-05) (hash(x)=25682723) +8848 train 6.720876 (lr=2.2602e-05) (hash(x)=28342241) +8849 train 6.483667 (lr=2.2594e-05) (hash(x)=25791125) +8850 val loss 6.6476 +8850 val perplexity 770.9026 +8850 train 6.082273 (lr=2.2585e-05) (hash(x)=21661861) +8851 train 6.257925 (lr=2.2576e-05) (hash(x)=23585532) +8852 train 6.089666 (lr=2.2567e-05) (hash(x)=23835271) +8853 train 6.457006 (lr=2.2559e-05) (hash(x)=25948723) +8854 train 6.566504 (lr=2.2550e-05) (hash(x)=25944805) +8855 train 6.259353 (lr=2.2541e-05) (hash(x)=22983818) +8856 train 6.749860 (lr=2.2532e-05) (hash(x)=30437159) +8857 train 6.614436 (lr=2.2524e-05) (hash(x)=27489824) +8858 train 6.723072 (lr=2.2515e-05) (hash(x)=25206173) +8859 train 6.702859 (lr=2.2506e-05) (hash(x)=23962560) +8860 train 6.609483 (lr=2.2498e-05) (hash(x)=25317033) +8861 train 6.590539 (lr=2.2489e-05) (hash(x)=23802688) +8862 train 6.522419 (lr=2.2480e-05) (hash(x)=23564792) +8863 train 6.728818 (lr=2.2472e-05) (hash(x)=25231749) +8864 train 6.520679 (lr=2.2463e-05) (hash(x)=24116652) +8865 train 6.633066 (lr=2.2454e-05) (hash(x)=28110264) +8866 train 6.513738 (lr=2.2446e-05) (hash(x)=26100965) +8867 train 6.267305 (lr=2.2437e-05) (hash(x)=22504975) +8868 train 6.348384 (lr=2.2429e-05) (hash(x)=23475781) +8869 train 6.091587 (lr=2.2420e-05) (hash(x)=18167940) +8870 train 6.369767 (lr=2.2411e-05) (hash(x)=23028338) +8871 train 6.256449 (lr=2.2403e-05) (hash(x)=22602033) +8872 train 6.583927 (lr=2.2394e-05) (hash(x)=26117205) +8873 train 6.925232 (lr=2.2386e-05) (hash(x)=25547734) +8874 train 6.532799 (lr=2.2377e-05) (hash(x)=22467339) +8875 train 6.784616 (lr=2.2368e-05) (hash(x)=28369634) +8876 train 6.984197 (lr=2.2360e-05) (hash(x)=28775193) +8877 train 6.880838 (lr=2.2351e-05) (hash(x)=30572716) +8878 train 6.528053 (lr=2.2343e-05) (hash(x)=25252828) +8879 train 6.915796 (lr=2.2334e-05) (hash(x)=27646283) +8880 train 6.502190 (lr=2.2326e-05) (hash(x)=24146650) +8881 train 6.173846 (lr=2.2317e-05) (hash(x)=22185738) +8882 train 6.595132 (lr=2.2309e-05) (hash(x)=26069473) +8883 train 6.823424 (lr=2.2300e-05) (hash(x)=25752645) +8884 train 6.220708 (lr=2.2292e-05) (hash(x)=25622978) +8885 train 5.790269 (lr=2.2283e-05) (hash(x)=16335769) +8886 train 5.965664 (lr=2.2275e-05) (hash(x)=17915719) +8887 train 6.794730 (lr=2.2266e-05) (hash(x)=24225306) +8888 train 6.534476 (lr=2.2258e-05) (hash(x)=27439136) +8889 train 6.293988 (lr=2.2249e-05) (hash(x)=21536256) +8890 train 6.457119 (lr=2.2241e-05) (hash(x)=27799104) +8891 train 6.839482 (lr=2.2232e-05) (hash(x)=27837497) +8892 train 6.814733 (lr=2.2224e-05) (hash(x)=25484348) +8893 train 6.803966 (lr=2.2215e-05) (hash(x)=26340510) +8894 train 6.193835 (lr=2.2207e-05) (hash(x)=20185884) +8895 train 6.554814 (lr=2.2199e-05) (hash(x)=25310638) +8896 train 6.574386 (lr=2.2190e-05) (hash(x)=25673874) +8897 train 7.026555 (lr=2.2182e-05) (hash(x)=27562096) +8898 train 6.938821 (lr=2.2173e-05) (hash(x)=29276502) +8899 train 6.259396 (lr=2.2165e-05) (hash(x)=21822104) +8900 val loss 6.6472 +8900 val perplexity 770.6564 +8900 train 6.533802 (lr=2.2157e-05) (hash(x)=26720680) +8901 train 6.424530 (lr=2.2148e-05) (hash(x)=23373839) +8902 train 6.657642 (lr=2.2140e-05) (hash(x)=24206699) +8903 train 6.910144 (lr=2.2131e-05) (hash(x)=26638313) +8904 train 6.675177 (lr=2.2123e-05) (hash(x)=24749489) +8905 train 6.272216 (lr=2.2115e-05) (hash(x)=20638335) +8906 train 7.050366 (lr=2.2106e-05) (hash(x)=28559243) +8907 train 7.173493 (lr=2.2098e-05) (hash(x)=32404659) +8908 train 6.510294 (lr=2.2090e-05) (hash(x)=22482170) +8909 train 6.725113 (lr=2.2081e-05) (hash(x)=26280758) +8910 train 6.635864 (lr=2.2073e-05) (hash(x)=23167730) +8911 train 6.367504 (lr=2.2065e-05) (hash(x)=23412334) +8912 train 6.642335 (lr=2.2057e-05) (hash(x)=25534782) +8913 train 6.454973 (lr=2.2048e-05) (hash(x)=22962570) +8914 train 6.280652 (lr=2.2040e-05) (hash(x)=21017162) +8915 train 6.334048 (lr=2.2032e-05) (hash(x)=21916690) +8916 train 6.770995 (lr=2.2023e-05) (hash(x)=27002497) +8917 train 6.956468 (lr=2.2015e-05) (hash(x)=25037197) +8918 train 6.704952 (lr=2.2007e-05) (hash(x)=27600648) +8919 train 6.438086 (lr=2.1999e-05) (hash(x)=23936809) +8920 train 6.531808 (lr=2.1990e-05) (hash(x)=24760257) +8921 train 6.490064 (lr=2.1982e-05) (hash(x)=24887124) +8922 train 6.507394 (lr=2.1974e-05) (hash(x)=22195711) +8923 train 6.443630 (lr=2.1966e-05) (hash(x)=24602728) +8924 train 6.394941 (lr=2.1958e-05) (hash(x)=24918808) +8925 train 6.397453 (lr=2.1949e-05) (hash(x)=23433273) +8926 train 6.369081 (lr=2.1941e-05) (hash(x)=25805868) +8927 train 6.801632 (lr=2.1933e-05) (hash(x)=27829482) +8928 train 6.497377 (lr=2.1925e-05) (hash(x)=25913318) +8929 train 6.429066 (lr=2.1917e-05) (hash(x)=25969594) +8930 train 6.360277 (lr=2.1908e-05) (hash(x)=25488037) +8931 train 6.353688 (lr=2.1900e-05) (hash(x)=19382426) +8932 train 6.852020 (lr=2.1892e-05) (hash(x)=26862030) +8933 train 6.532066 (lr=2.1884e-05) (hash(x)=24934849) +8934 train 6.539623 (lr=2.1876e-05) (hash(x)=22572609) +8935 train 6.463147 (lr=2.1868e-05) (hash(x)=22773307) +8936 train 6.594986 (lr=2.1860e-05) (hash(x)=24391569) +8937 train 6.912981 (lr=2.1851e-05) (hash(x)=24926482) +8938 train 6.627120 (lr=2.1843e-05) (hash(x)=24143375) +8939 train 6.639394 (lr=2.1835e-05) (hash(x)=26772134) +8940 train 6.190619 (lr=2.1827e-05) (hash(x)=19926992) +8941 train 6.287183 (lr=2.1819e-05) (hash(x)=20062224) +8942 train 6.546944 (lr=2.1811e-05) (hash(x)=21782337) +8943 train 6.573734 (lr=2.1803e-05) (hash(x)=25784576) +8944 train 6.652446 (lr=2.1795e-05) (hash(x)=24580606) +8945 train 6.472230 (lr=2.1787e-05) (hash(x)=24998258) +8946 train 6.323936 (lr=2.1779e-05) (hash(x)=22494003) +8947 train 6.436369 (lr=2.1771e-05) (hash(x)=23086245) +8948 train 6.586824 (lr=2.1763e-05) (hash(x)=24733163) +8949 train 6.472614 (lr=2.1755e-05) (hash(x)=23073697) +8950 val loss 6.6496 +8950 val perplexity 772.4767 +8950 train 6.487410 (lr=2.1747e-05) (hash(x)=21853765) +8951 train 6.273366 (lr=2.1739e-05) (hash(x)=24228273) +8952 train 7.132581 (lr=2.1731e-05) (hash(x)=29084643) +8953 train 6.397983 (lr=2.1723e-05) (hash(x)=25182395) +8954 train 6.413599 (lr=2.1715e-05) (hash(x)=24177905) +8955 train 6.649852 (lr=2.1707e-05) (hash(x)=26187461) +8956 train 6.886891 (lr=2.1699e-05) (hash(x)=26025256) +8957 train 6.970254 (lr=2.1691e-05) (hash(x)=27869663) +8958 train 6.556131 (lr=2.1683e-05) (hash(x)=23615442) +8959 train 6.794820 (lr=2.1675e-05) (hash(x)=28563822) +8960 train 6.642966 (lr=2.1667e-05) (hash(x)=24842324) +8961 train 6.705481 (lr=2.1659e-05) (hash(x)=29772723) +8962 train 6.607500 (lr=2.1651e-05) (hash(x)=26574930) +8963 train 6.506393 (lr=2.1643e-05) (hash(x)=24672684) +8964 train 6.667793 (lr=2.1635e-05) (hash(x)=25435702) +8965 train 6.671445 (lr=2.1627e-05) (hash(x)=24186582) +8966 train 6.372623 (lr=2.1619e-05) (hash(x)=25352260) +8967 train 6.474668 (lr=2.1611e-05) (hash(x)=22613352) +8968 train 6.732846 (lr=2.1604e-05) (hash(x)=28644124) +8969 train 6.617206 (lr=2.1596e-05) (hash(x)=21988584) +8970 train 6.850403 (lr=2.1588e-05) (hash(x)=26312535) +8971 train 6.358171 (lr=2.1580e-05) (hash(x)=23785827) +8972 train 6.517017 (lr=2.1572e-05) (hash(x)=24372109) +8973 train 6.561804 (lr=2.1564e-05) (hash(x)=24743580) +8974 train 6.178829 (lr=2.1556e-05) (hash(x)=19593213) +8975 train 6.716358 (lr=2.1549e-05) (hash(x)=26277740) +8976 train 6.732576 (lr=2.1541e-05) (hash(x)=26273778) +8977 train 6.627294 (lr=2.1533e-05) (hash(x)=24414336) +8978 train 6.751396 (lr=2.1525e-05) (hash(x)=28106054) +8979 train 6.636346 (lr=2.1517e-05) (hash(x)=26103115) +8980 train 6.651338 (lr=2.1509e-05) (hash(x)=24948128) +8981 train 6.557690 (lr=2.1502e-05) (hash(x)=24247829) +8982 train 6.661812 (lr=2.1494e-05) (hash(x)=22865026) +8983 train 6.632744 (lr=2.1486e-05) (hash(x)=25910468) +8984 train 6.691420 (lr=2.1478e-05) (hash(x)=27234274) +8985 train 6.551815 (lr=2.1471e-05) (hash(x)=23035523) +8986 train 6.560637 (lr=2.1463e-05) (hash(x)=21584428) +8987 train 6.594011 (lr=2.1455e-05) (hash(x)=25036040) +8988 train 6.345907 (lr=2.1447e-05) (hash(x)=21469728) +8989 train 6.464258 (lr=2.1440e-05) (hash(x)=23742647) +8990 train 6.830983 (lr=2.1432e-05) (hash(x)=30650073) +8991 train 6.632387 (lr=2.1424e-05) (hash(x)=25973739) +8992 train 6.655666 (lr=2.1416e-05) (hash(x)=24263902) +8993 train 6.562112 (lr=2.1409e-05) (hash(x)=25988151) +8994 train 6.621278 (lr=2.1401e-05) (hash(x)=25119223) +8995 train 7.218901 (lr=2.1393e-05) (hash(x)=29686377) +8996 train 7.637837 (lr=2.1386e-05) (hash(x)=36202600) +8997 train 7.636045 (lr=2.1378e-05) (hash(x)=34295460) +8998 train 6.243412 (lr=2.1370e-05) (hash(x)=20289529) +8999 train 6.292711 (lr=2.1363e-05) (hash(x)=21974495) +9000 val loss 6.6437 +9000 val perplexity 767.9147 +9000 train 6.459174 (lr=2.1355e-05) (hash(x)=24239485) +9001 train 6.587346 (lr=2.1347e-05) (hash(x)=26050769) +9002 train 6.475616 (lr=2.1340e-05) (hash(x)=25926483) +9003 train 6.500825 (lr=2.1332e-05) (hash(x)=26055960) +9004 train 6.662062 (lr=2.1325e-05) (hash(x)=26800793) +9005 train 6.330394 (lr=2.1317e-05) (hash(x)=24501814) +9006 train 6.573635 (lr=2.1309e-05) (hash(x)=23270439) +9007 train 6.431807 (lr=2.1302e-05) (hash(x)=24048226) +9008 train 5.890071 (lr=2.1294e-05) (hash(x)=16652432) +9009 train 6.257294 (lr=2.1287e-05) (hash(x)=23492861) +9010 train 6.383750 (lr=2.1279e-05) (hash(x)=21299317) +9011 train 6.709564 (lr=2.1271e-05) (hash(x)=26408832) +9012 train 6.745391 (lr=2.1264e-05) (hash(x)=26584480) +9013 train 6.796146 (lr=2.1256e-05) (hash(x)=26771989) +9014 train 6.827872 (lr=2.1249e-05) (hash(x)=27145935) +9015 train 6.793513 (lr=2.1241e-05) (hash(x)=31689089) +9016 train 6.731533 (lr=2.1234e-05) (hash(x)=26885967) +9017 train 6.498445 (lr=2.1226e-05) (hash(x)=24874804) +9018 train 6.253002 (lr=2.1219e-05) (hash(x)=22070335) +9019 train 6.574771 (lr=2.1211e-05) (hash(x)=25221725) +9020 train 6.669769 (lr=2.1204e-05) (hash(x)=24790549) +9021 train 6.561818 (lr=2.1196e-05) (hash(x)=24482119) +9022 train 6.336987 (lr=2.1189e-05) (hash(x)=25898842) +9023 train 6.534312 (lr=2.1181e-05) (hash(x)=23209952) +9024 train 6.527933 (lr=2.1174e-05) (hash(x)=25260019) +9025 train 6.134933 (lr=2.1166e-05) (hash(x)=19180586) +9026 train 6.584012 (lr=2.1159e-05) (hash(x)=25032927) +9027 train 6.459397 (lr=2.1151e-05) (hash(x)=25975211) +9028 train 7.122793 (lr=2.1144e-05) (hash(x)=26271082) +9029 train 6.905295 (lr=2.1136e-05) (hash(x)=31450093) +9030 train 6.212322 (lr=2.1129e-05) (hash(x)=20736284) +9031 train 6.552136 (lr=2.1122e-05) (hash(x)=24836505) +9032 train 6.891275 (lr=2.1114e-05) (hash(x)=30624650) +9033 train 6.941224 (lr=2.1107e-05) (hash(x)=31115605) +9034 train 6.609634 (lr=2.1099e-05) (hash(x)=26339705) +9035 train 6.790312 (lr=2.1092e-05) (hash(x)=29081003) +9036 train 6.599048 (lr=2.1085e-05) (hash(x)=24740097) +9037 train 6.904994 (lr=2.1077e-05) (hash(x)=25633419) +9038 train 6.376090 (lr=2.1070e-05) (hash(x)=24299047) +9039 train 6.447081 (lr=2.1062e-05) (hash(x)=24929260) +9040 train 6.560443 (lr=2.1055e-05) (hash(x)=25968950) +9041 train 6.547569 (lr=2.1048e-05) (hash(x)=25088572) +9042 train 6.999001 (lr=2.1040e-05) (hash(x)=30661959) +9043 train 6.966756 (lr=2.1033e-05) (hash(x)=31355108) +9044 train 6.566985 (lr=2.1026e-05) (hash(x)=22973056) +9045 train 7.152983 (lr=2.1018e-05) (hash(x)=25068406) +9046 train 6.662148 (lr=2.1011e-05) (hash(x)=24226993) +9047 train 6.567325 (lr=2.1004e-05) (hash(x)=26776257) +9048 train 6.465736 (lr=2.0997e-05) (hash(x)=25126336) +9049 train 6.663368 (lr=2.0989e-05) (hash(x)=23307542) +9050 val loss 6.6452 +9050 val perplexity 769.0554 +9050 train 6.542237 (lr=2.0982e-05) (hash(x)=26979454) +9051 train 6.240234 (lr=2.0975e-05) (hash(x)=22466194) +9052 train 6.628737 (lr=2.0967e-05) (hash(x)=24082730) +9053 train 6.504655 (lr=2.0960e-05) (hash(x)=25030928) +9054 train 6.256500 (lr=2.0953e-05) (hash(x)=17568374) +9055 train 6.113745 (lr=2.0946e-05) (hash(x)=16899654) +9056 train 6.553908 (lr=2.0938e-05) (hash(x)=24612765) +9057 train 6.585964 (lr=2.0931e-05) (hash(x)=23999559) +9058 train 6.828987 (lr=2.0924e-05) (hash(x)=25824485) +9059 train 6.451093 (lr=2.0917e-05) (hash(x)=21389104) +9060 train 6.345010 (lr=2.0910e-05) (hash(x)=21722951) +9061 train 7.030707 (lr=2.0902e-05) (hash(x)=30558637) +9062 train 6.756346 (lr=2.0895e-05) (hash(x)=24033688) +9063 train 6.579618 (lr=2.0888e-05) (hash(x)=21875140) +9064 train 6.603675 (lr=2.0881e-05) (hash(x)=23862745) +9065 train 6.544387 (lr=2.0874e-05) (hash(x)=24902157) +9066 train 6.433049 (lr=2.0867e-05) (hash(x)=24682502) +9067 train 6.705353 (lr=2.0859e-05) (hash(x)=28022349) +9068 train 6.737311 (lr=2.0852e-05) (hash(x)=25886770) +9069 train 6.702477 (lr=2.0845e-05) (hash(x)=29456041) +9070 train 6.671536 (lr=2.0838e-05) (hash(x)=26411869) +9071 train 6.685962 (lr=2.0831e-05) (hash(x)=28701451) +9072 train 6.252660 (lr=2.0824e-05) (hash(x)=22317347) +9073 train 6.410497 (lr=2.0817e-05) (hash(x)=22874706) +9074 train 6.350862 (lr=2.0810e-05) (hash(x)=21490948) +9075 train 6.180054 (lr=2.0802e-05) (hash(x)=20174998) +9076 train 6.366919 (lr=2.0795e-05) (hash(x)=23783972) +9077 train 6.432173 (lr=2.0788e-05) (hash(x)=22643736) +9078 train 6.820276 (lr=2.0781e-05) (hash(x)=25257743) +9079 train 6.520775 (lr=2.0774e-05) (hash(x)=24430351) +9080 train 6.354766 (lr=2.0767e-05) (hash(x)=22235750) +9081 train 6.699642 (lr=2.0760e-05) (hash(x)=23915392) +9082 train 6.317273 (lr=2.0753e-05) (hash(x)=21287787) +9083 train 6.249547 (lr=2.0746e-05) (hash(x)=19353265) +9084 train 6.482569 (lr=2.0739e-05) (hash(x)=22958440) +9085 train 6.267360 (lr=2.0732e-05) (hash(x)=22419491) +9086 train 6.547076 (lr=2.0725e-05) (hash(x)=23459506) +9087 train 7.083869 (lr=2.0718e-05) (hash(x)=26805171) +9088 train 7.125351 (lr=2.0711e-05) (hash(x)=28209541) +9089 train 7.023525 (lr=2.0704e-05) (hash(x)=27147478) +9090 train 6.440376 (lr=2.0697e-05) (hash(x)=23121825) +9091 train 6.540563 (lr=2.0690e-05) (hash(x)=25684089) +9092 train 6.643010 (lr=2.0683e-05) (hash(x)=23746405) +9093 train 6.836931 (lr=2.0676e-05) (hash(x)=25501424) +9094 train 6.409348 (lr=2.0669e-05) (hash(x)=21880340) +9095 train 6.312646 (lr=2.0662e-05) (hash(x)=22971332) +9096 train 6.533618 (lr=2.0655e-05) (hash(x)=26520287) +9097 train 6.502580 (lr=2.0648e-05) (hash(x)=23772630) +9098 train 6.677915 (lr=2.0641e-05) (hash(x)=25509572) +9099 train 6.529162 (lr=2.0634e-05) (hash(x)=23430488) +9100 val loss 6.6403 +9100 val perplexity 765.2974 +9100 train 6.370384 (lr=2.0627e-05) (hash(x)=20893340) +9101 train 6.623824 (lr=2.0621e-05) (hash(x)=25389402) +9102 train 6.605816 (lr=2.0614e-05) (hash(x)=24870357) +9103 train 6.502847 (lr=2.0607e-05) (hash(x)=23313042) +9104 train 6.087887 (lr=2.0600e-05) (hash(x)=19141040) +9105 train 6.253181 (lr=2.0593e-05) (hash(x)=23625720) +9106 train 6.711902 (lr=2.0586e-05) (hash(x)=24701265) +9107 train 6.522183 (lr=2.0579e-05) (hash(x)=23152055) +9108 train 6.300448 (lr=2.0573e-05) (hash(x)=21627113) +9109 train 6.522536 (lr=2.0566e-05) (hash(x)=23643199) +9110 train 6.030354 (lr=2.0559e-05) (hash(x)=19569504) +9111 train 6.667950 (lr=2.0552e-05) (hash(x)=25651770) +9112 train 6.231370 (lr=2.0545e-05) (hash(x)=20838422) +9113 train 6.375637 (lr=2.0538e-05) (hash(x)=22219315) +9114 train 6.797569 (lr=2.0532e-05) (hash(x)=30769128) +9115 train 6.500165 (lr=2.0525e-05) (hash(x)=25076930) +9116 train 6.712369 (lr=2.0518e-05) (hash(x)=26809537) +9117 train 7.274558 (lr=2.0511e-05) (hash(x)=31787246) +9118 train 7.263929 (lr=2.0504e-05) (hash(x)=29330491) +9119 train 6.323291 (lr=2.0498e-05) (hash(x)=21621425) +9120 train 6.519324 (lr=2.0491e-05) (hash(x)=21780630) +9121 train 6.684480 (lr=2.0484e-05) (hash(x)=28836715) +9122 train 6.569617 (lr=2.0477e-05) (hash(x)=23802252) +9123 train 6.416270 (lr=2.0471e-05) (hash(x)=23028096) +9124 train 6.497173 (lr=2.0464e-05) (hash(x)=21960468) +9125 train 6.440488 (lr=2.0457e-05) (hash(x)=25664497) +9126 train 6.475012 (lr=2.0451e-05) (hash(x)=24387831) +9127 train 6.540100 (lr=2.0444e-05) (hash(x)=25104779) +9128 train 6.268877 (lr=2.0437e-05) (hash(x)=22510653) +9129 train 6.829474 (lr=2.0430e-05) (hash(x)=27507283) +9130 train 7.105706 (lr=2.0424e-05) (hash(x)=29587949) +9131 train 6.699957 (lr=2.0417e-05) (hash(x)=26484624) +9132 train 6.341288 (lr=2.0410e-05) (hash(x)=22837889) +9133 train 6.820790 (lr=2.0404e-05) (hash(x)=24836151) +9134 train 6.641150 (lr=2.0397e-05) (hash(x)=26534625) +9135 train 6.861594 (lr=2.0390e-05) (hash(x)=30109204) +9136 train 6.167636 (lr=2.0384e-05) (hash(x)=21469465) +9137 train 6.334138 (lr=2.0377e-05) (hash(x)=24267037) +9138 train 6.774049 (lr=2.0371e-05) (hash(x)=21670451) +9139 train 6.524863 (lr=2.0364e-05) (hash(x)=19707952) +9140 train 6.612137 (lr=2.0357e-05) (hash(x)=24039226) +9141 train 6.520522 (lr=2.0351e-05) (hash(x)=24677643) +9142 train 6.406798 (lr=2.0344e-05) (hash(x)=20841628) +9143 train 6.591863 (lr=2.0338e-05) (hash(x)=25317075) +9144 train 6.130583 (lr=2.0331e-05) (hash(x)=18134237) +9145 train 6.454084 (lr=2.0324e-05) (hash(x)=25191498) +9146 train 6.910151 (lr=2.0318e-05) (hash(x)=25647557) +9147 train 7.129046 (lr=2.0311e-05) (hash(x)=26848392) +9148 train 6.911962 (lr=2.0305e-05) (hash(x)=26730329) +9149 train 6.736307 (lr=2.0298e-05) (hash(x)=26202222) +9150 val loss 6.6385 +9150 val perplexity 763.9487 +9150 train 6.796690 (lr=2.0292e-05) (hash(x)=27144676) +9151 train 6.391327 (lr=2.0285e-05) (hash(x)=22341233) +9152 train 6.593953 (lr=2.0279e-05) (hash(x)=27071110) +9153 train 6.540374 (lr=2.0272e-05) (hash(x)=24349007) +9154 train 6.636922 (lr=2.0266e-05) (hash(x)=28280110) +9155 train 6.956235 (lr=2.0259e-05) (hash(x)=30059041) +9156 train 7.000773 (lr=2.0253e-05) (hash(x)=25759891) +9157 train 6.843100 (lr=2.0246e-05) (hash(x)=26107179) +9158 train 6.643211 (lr=2.0240e-05) (hash(x)=27946494) +9159 train 6.414499 (lr=2.0233e-05) (hash(x)=25850406) +9160 train 6.401083 (lr=2.0227e-05) (hash(x)=23819578) +9161 train 6.501044 (lr=2.0220e-05) (hash(x)=26496160) +9162 train 6.156096 (lr=2.0214e-05) (hash(x)=25440129) +9163 train 6.197886 (lr=2.0207e-05) (hash(x)=23340008) +9164 train 6.348926 (lr=2.0201e-05) (hash(x)=24495290) +9165 train 6.406624 (lr=2.0195e-05) (hash(x)=22137910) +9166 train 6.364319 (lr=2.0188e-05) (hash(x)=23150451) +9167 train 6.533990 (lr=2.0182e-05) (hash(x)=23732439) +9168 train 6.426977 (lr=2.0175e-05) (hash(x)=24467313) +9169 train 6.339980 (lr=2.0169e-05) (hash(x)=22063327) +9170 train 6.388768 (lr=2.0163e-05) (hash(x)=23305072) +9171 train 6.514081 (lr=2.0156e-05) (hash(x)=22629233) +9172 train 6.608959 (lr=2.0150e-05) (hash(x)=21483936) +9173 train 6.256128 (lr=2.0143e-05) (hash(x)=20363154) +9174 train 6.411287 (lr=2.0137e-05) (hash(x)=24378898) +9175 train 6.233238 (lr=2.0131e-05) (hash(x)=20890194) +9176 train 6.391384 (lr=2.0124e-05) (hash(x)=21003462) +9177 train 6.358519 (lr=2.0118e-05) (hash(x)=21133576) +9178 train 6.447913 (lr=2.0112e-05) (hash(x)=23596215) +9179 train 6.265294 (lr=2.0105e-05) (hash(x)=17617224) +9180 train 6.622192 (lr=2.0099e-05) (hash(x)=25716742) +9181 train 7.636861 (lr=2.0093e-05) (hash(x)=36927425) +9182 train 7.393723 (lr=2.0087e-05) (hash(x)=33803746) +9183 train 6.467655 (lr=2.0080e-05) (hash(x)=23302742) +9184 train 6.413693 (lr=2.0074e-05) (hash(x)=23556493) +9185 train 6.652478 (lr=2.0068e-05) (hash(x)=26149010) +9186 train 6.582948 (lr=2.0061e-05) (hash(x)=23825469) +9187 train 6.685520 (lr=2.0055e-05) (hash(x)=25768565) +9188 train 6.438413 (lr=2.0049e-05) (hash(x)=26095324) +9189 train 6.421281 (lr=2.0043e-05) (hash(x)=21162451) +9190 train 7.125652 (lr=2.0036e-05) (hash(x)=29199910) +9191 train 6.928459 (lr=2.0030e-05) (hash(x)=27134148) +9192 train 7.094827 (lr=2.0024e-05) (hash(x)=31411014) +9193 train 7.074428 (lr=2.0018e-05) (hash(x)=28646304) +9194 train 6.846988 (lr=2.0012e-05) (hash(x)=26112500) +9195 train 7.352482 (lr=2.0005e-05) (hash(x)=32041599) +9196 train 7.159222 (lr=1.9999e-05) (hash(x)=30384700) +9197 train 7.345566 (lr=1.9993e-05) (hash(x)=32791607) +9198 train 7.103821 (lr=1.9987e-05) (hash(x)=30433512) +9199 train 6.354040 (lr=1.9981e-05) (hash(x)=23262927) +9200 val loss 6.6389 +9200 val perplexity 764.2234 +9200 train 6.510211 (lr=1.9975e-05) (hash(x)=25735666) +9201 train 6.490416 (lr=1.9968e-05) (hash(x)=24952007) +9202 train 6.368518 (lr=1.9962e-05) (hash(x)=22019766) +9203 train 6.227195 (lr=1.9956e-05) (hash(x)=21711657) +9204 train 6.635931 (lr=1.9950e-05) (hash(x)=24875306) +9205 train 6.363454 (lr=1.9944e-05) (hash(x)=24362530) +9206 train 6.351857 (lr=1.9938e-05) (hash(x)=22076419) +9207 train 6.749822 (lr=1.9932e-05) (hash(x)=28382544) +9208 train 6.380038 (lr=1.9926e-05) (hash(x)=24843764) +9209 train 7.077409 (lr=1.9919e-05) (hash(x)=29987122) +9210 train 7.445177 (lr=1.9913e-05) (hash(x)=33278552) +9211 train 6.610921 (lr=1.9907e-05) (hash(x)=26618651) +9212 train 6.548019 (lr=1.9901e-05) (hash(x)=27285887) +9213 train 6.215189 (lr=1.9895e-05) (hash(x)=22061506) +9214 train 6.492844 (lr=1.9889e-05) (hash(x)=23789658) +9215 train 6.947005 (lr=1.9883e-05) (hash(x)=30322804) +9216 train 6.723122 (lr=1.9877e-05) (hash(x)=24331425) +9217 train 6.397577 (lr=1.9871e-05) (hash(x)=23027458) +9218 train 6.685774 (lr=1.9865e-05) (hash(x)=26106961) +9219 train 6.540910 (lr=1.9859e-05) (hash(x)=22959915) +9220 train 6.577232 (lr=1.9853e-05) (hash(x)=24468059) +9221 train 6.462518 (lr=1.9847e-05) (hash(x)=25857145) +9222 train 6.590186 (lr=1.9841e-05) (hash(x)=28184570) +9223 train 6.343802 (lr=1.9835e-05) (hash(x)=24743366) +9224 train 6.525176 (lr=1.9829e-05) (hash(x)=23498435) +9225 train 6.735257 (lr=1.9823e-05) (hash(x)=25161787) +9226 train 5.923873 (lr=1.9817e-05) (hash(x)=18127591) +9227 train 6.621706 (lr=1.9811e-05) (hash(x)=23923395) +9228 train 8.276273 (lr=1.9805e-05) (hash(x)=27583048) +9229 train 6.805570 (lr=1.9799e-05) (hash(x)=25344762) +9230 train 6.214119 (lr=1.9793e-05) (hash(x)=22718066) +9231 train 6.703485 (lr=1.9787e-05) (hash(x)=26026937) +9232 train 6.665390 (lr=1.9782e-05) (hash(x)=23965637) +9233 train 6.179718 (lr=1.9776e-05) (hash(x)=19631904) +9234 train 6.569664 (lr=1.9770e-05) (hash(x)=27710783) +9235 train 5.999853 (lr=1.9764e-05) (hash(x)=18767284) +9236 train 6.667754 (lr=1.9758e-05) (hash(x)=25052312) +9237 train 6.538290 (lr=1.9752e-05) (hash(x)=24548153) +9238 train 6.570952 (lr=1.9746e-05) (hash(x)=23635032) +9239 train 7.236055 (lr=1.9740e-05) (hash(x)=27467591) +9240 train 6.541365 (lr=1.9734e-05) (hash(x)=23237356) +9241 train 6.618506 (lr=1.9729e-05) (hash(x)=25582248) +9242 train 6.753753 (lr=1.9723e-05) (hash(x)=27088689) +9243 train 6.092860 (lr=1.9717e-05) (hash(x)=17302241) +9244 train 6.327064 (lr=1.9711e-05) (hash(x)=23904432) +9245 train 6.596864 (lr=1.9705e-05) (hash(x)=27112605) +9246 train 6.823981 (lr=1.9699e-05) (hash(x)=30366699) +9247 train 6.370931 (lr=1.9694e-05) (hash(x)=22135596) +9248 train 6.669678 (lr=1.9688e-05) (hash(x)=26501906) +9249 train 6.418915 (lr=1.9682e-05) (hash(x)=23715941) +9250 val loss 6.6398 +9250 val perplexity 764.9702 +9250 train 6.496349 (lr=1.9676e-05) (hash(x)=24623579) +9251 train 6.677011 (lr=1.9671e-05) (hash(x)=25475640) +9252 train 6.464041 (lr=1.9665e-05) (hash(x)=23984729) +9253 train 6.463147 (lr=1.9659e-05) (hash(x)=24166270) +9254 train 6.362035 (lr=1.9653e-05) (hash(x)=21070832) +9255 train 6.640248 (lr=1.9648e-05) (hash(x)=24733333) +9256 train 6.795125 (lr=1.9642e-05) (hash(x)=25755506) +9257 train 6.373361 (lr=1.9636e-05) (hash(x)=23362130) +9258 train 6.702139 (lr=1.9630e-05) (hash(x)=26071982) +9259 train 7.034224 (lr=1.9625e-05) (hash(x)=29134326) +9260 train 7.547666 (lr=1.9619e-05) (hash(x)=34979012) +9261 train 6.454423 (lr=1.9613e-05) (hash(x)=22943282) +9262 train 6.431675 (lr=1.9608e-05) (hash(x)=22667765) +9263 train 6.521533 (lr=1.9602e-05) (hash(x)=25355718) +9264 train 6.683718 (lr=1.9596e-05) (hash(x)=26595295) +9265 train 6.702658 (lr=1.9591e-05) (hash(x)=28747908) +9266 train 6.432597 (lr=1.9585e-05) (hash(x)=20211405) +9267 train 6.371574 (lr=1.9579e-05) (hash(x)=20883581) +9268 train 6.417848 (lr=1.9574e-05) (hash(x)=22147212) +9269 train 6.158418 (lr=1.9568e-05) (hash(x)=20312611) +9270 train 6.325805 (lr=1.9562e-05) (hash(x)=23405223) +9271 train 6.313474 (lr=1.9557e-05) (hash(x)=21985459) +9272 train 6.355508 (lr=1.9551e-05) (hash(x)=25223418) +9273 train 6.352933 (lr=1.9545e-05) (hash(x)=22572927) +9274 train 6.647386 (lr=1.9540e-05) (hash(x)=27967387) +9275 train 6.751810 (lr=1.9534e-05) (hash(x)=24786229) +9276 train 6.669498 (lr=1.9529e-05) (hash(x)=24488758) +9277 train 6.480626 (lr=1.9523e-05) (hash(x)=25937020) +9278 train 6.860524 (lr=1.9518e-05) (hash(x)=28914580) +9279 train 6.256820 (lr=1.9512e-05) (hash(x)=22036120) +9280 train 6.600450 (lr=1.9506e-05) (hash(x)=24356344) +9281 train 6.527108 (lr=1.9501e-05) (hash(x)=24687165) +9282 train 6.606666 (lr=1.9495e-05) (hash(x)=24569860) +9283 train 6.438738 (lr=1.9490e-05) (hash(x)=23176408) +9284 train 6.479043 (lr=1.9484e-05) (hash(x)=21725924) +9285 train 6.638021 (lr=1.9479e-05) (hash(x)=25285954) +9286 train 6.405211 (lr=1.9473e-05) (hash(x)=22936662) +9287 train 6.522228 (lr=1.9468e-05) (hash(x)=21175158) +9288 train 6.882335 (lr=1.9462e-05) (hash(x)=24432059) +9289 train 6.638992 (lr=1.9457e-05) (hash(x)=21870295) +9290 train 6.299043 (lr=1.9451e-05) (hash(x)=21677468) +9291 train 6.508172 (lr=1.9446e-05) (hash(x)=24293642) +9292 train 6.277721 (lr=1.9440e-05) (hash(x)=19899173) +9293 train 6.726045 (lr=1.9435e-05) (hash(x)=25383408) +9294 train 6.572942 (lr=1.9429e-05) (hash(x)=23271382) +9295 train 6.642019 (lr=1.9424e-05) (hash(x)=27609191) +9296 train 6.771920 (lr=1.9419e-05) (hash(x)=29456990) +9297 train 6.520879 (lr=1.9413e-05) (hash(x)=24525729) +9298 train 6.334966 (lr=1.9408e-05) (hash(x)=24515653) +9299 train 6.154602 (lr=1.9402e-05) (hash(x)=21053202) +9300 val loss 6.6419 +9300 val perplexity 766.5658 +9300 train 6.025365 (lr=1.9397e-05) (hash(x)=17927693) +9301 train 6.350759 (lr=1.9392e-05) (hash(x)=20812412) +9302 train 6.280605 (lr=1.9386e-05) (hash(x)=22327784) +9303 train 6.314722 (lr=1.9381e-05) (hash(x)=23392029) +9304 train 6.503458 (lr=1.9375e-05) (hash(x)=24956888) +9305 train 6.283790 (lr=1.9370e-05) (hash(x)=19081898) +9306 train 6.426634 (lr=1.9365e-05) (hash(x)=22262068) +9307 train 6.511678 (lr=1.9359e-05) (hash(x)=23420997) +9308 train 7.699820 (lr=1.9354e-05) (hash(x)=31366600) +9309 train 6.578604 (lr=1.9349e-05) (hash(x)=24652208) +9310 train 6.477832 (lr=1.9343e-05) (hash(x)=22966996) +9311 train 6.471540 (lr=1.9338e-05) (hash(x)=23209578) +9312 train 6.455438 (lr=1.9333e-05) (hash(x)=21610459) +9313 train 6.418200 (lr=1.9327e-05) (hash(x)=25376744) +9314 train 6.396355 (lr=1.9322e-05) (hash(x)=24196791) +9315 train 6.954695 (lr=1.9317e-05) (hash(x)=29242161) +9316 train 7.100670 (lr=1.9312e-05) (hash(x)=31389192) +9317 train 6.593749 (lr=1.9306e-05) (hash(x)=27360485) +9318 train 6.328004 (lr=1.9301e-05) (hash(x)=24619436) +9319 train 6.535746 (lr=1.9296e-05) (hash(x)=24824528) +9320 train 6.519721 (lr=1.9290e-05) (hash(x)=25223720) +9321 train 6.400181 (lr=1.9285e-05) (hash(x)=22938842) +9322 train 6.483280 (lr=1.9280e-05) (hash(x)=24515640) +9323 train 6.792175 (lr=1.9275e-05) (hash(x)=27199401) +9324 train 6.879245 (lr=1.9270e-05) (hash(x)=26157638) +9325 train 6.956494 (lr=1.9264e-05) (hash(x)=29148627) +9326 train 6.523042 (lr=1.9259e-05) (hash(x)=25006031) +9327 train 6.512511 (lr=1.9254e-05) (hash(x)=24964626) +9328 train 6.285335 (lr=1.9249e-05) (hash(x)=21864131) +9329 train 6.654961 (lr=1.9244e-05) (hash(x)=26761990) +9330 train 6.691828 (lr=1.9238e-05) (hash(x)=23715726) +9331 train 6.227531 (lr=1.9233e-05) (hash(x)=23023484) +9332 train 6.323021 (lr=1.9228e-05) (hash(x)=22179342) +9333 train 6.520900 (lr=1.9223e-05) (hash(x)=26062015) +9334 train 6.637733 (lr=1.9218e-05) (hash(x)=27352857) +9335 train 6.965816 (lr=1.9213e-05) (hash(x)=28428887) +9336 train 6.449550 (lr=1.9208e-05) (hash(x)=25471415) +9337 train 6.382815 (lr=1.9202e-05) (hash(x)=23945512) +9338 train 6.897778 (lr=1.9197e-05) (hash(x)=30476226) +9339 train 6.536152 (lr=1.9192e-05) (hash(x)=19422223) +9340 train 6.566239 (lr=1.9187e-05) (hash(x)=22533318) +9341 train 6.423532 (lr=1.9182e-05) (hash(x)=24825184) +9342 train 6.555858 (lr=1.9177e-05) (hash(x)=24474252) +9343 train 6.509491 (lr=1.9172e-05) (hash(x)=26789021) +9344 train 6.687570 (lr=1.9167e-05) (hash(x)=25440658) +9345 train 6.654340 (lr=1.9162e-05) (hash(x)=25431844) +9346 train 6.662797 (lr=1.9157e-05) (hash(x)=26173188) +9347 train 6.603400 (lr=1.9152e-05) (hash(x)=26055887) +9348 train 7.170884 (lr=1.9147e-05) (hash(x)=30845354) +9349 train 6.670100 (lr=1.9142e-05) (hash(x)=25239899) +9350 val loss 6.6398 +9350 val perplexity 764.9213 +9350 train 6.363900 (lr=1.9137e-05) (hash(x)=24170815) +9351 train 6.351318 (lr=1.9132e-05) (hash(x)=22695968) +9352 train 6.598764 (lr=1.9127e-05) (hash(x)=28075168) +9353 train 6.669237 (lr=1.9122e-05) (hash(x)=24889127) +9354 train 6.822958 (lr=1.9117e-05) (hash(x)=28389276) +9355 train 6.258914 (lr=1.9112e-05) (hash(x)=20254044) +9356 train 6.447437 (lr=1.9107e-05) (hash(x)=25423015) +9357 train 6.515213 (lr=1.9102e-05) (hash(x)=26509174) +9358 train 6.607610 (lr=1.9097e-05) (hash(x)=26246963) +9359 train 6.083019 (lr=1.9092e-05) (hash(x)=21215047) +9360 train 6.360711 (lr=1.9087e-05) (hash(x)=21336867) +9361 train 6.458473 (lr=1.9082e-05) (hash(x)=22276078) +9362 train 6.716943 (lr=1.9077e-05) (hash(x)=25335512) +9363 train 6.538544 (lr=1.9072e-05) (hash(x)=24417502) +9364 train 6.178649 (lr=1.9067e-05) (hash(x)=20448762) +9365 train 6.747194 (lr=1.9062e-05) (hash(x)=24831012) +9366 train 6.890821 (lr=1.9057e-05) (hash(x)=26120200) +9367 train 6.563367 (lr=1.9052e-05) (hash(x)=25223052) +9368 train 6.172956 (lr=1.9047e-05) (hash(x)=21475349) +9369 train 6.865755 (lr=1.9043e-05) (hash(x)=27387700) +9370 train 6.946926 (lr=1.9038e-05) (hash(x)=30844781) +9371 train 6.515827 (lr=1.9033e-05) (hash(x)=26998654) +9372 train 6.537465 (lr=1.9028e-05) (hash(x)=24994378) +9373 train 6.271487 (lr=1.9023e-05) (hash(x)=21023223) +9374 train 6.524780 (lr=1.9018e-05) (hash(x)=24091903) +9375 train 6.615566 (lr=1.9013e-05) (hash(x)=28701940) +9376 train 6.650849 (lr=1.9009e-05) (hash(x)=27553802) +9377 train 6.581236 (lr=1.9004e-05) (hash(x)=27322792) +9378 train 6.495453 (lr=1.8999e-05) (hash(x)=21814629) +9379 train 6.977174 (lr=1.8994e-05) (hash(x)=25397088) +9380 train 6.387009 (lr=1.8989e-05) (hash(x)=22045626) +9381 train 6.136741 (lr=1.8985e-05) (hash(x)=22912781) +9382 train 6.393957 (lr=1.8980e-05) (hash(x)=24926822) +9383 train 6.822256 (lr=1.8975e-05) (hash(x)=26562495) +9384 train 6.721315 (lr=1.8970e-05) (hash(x)=24052605) +9385 train 6.718559 (lr=1.8966e-05) (hash(x)=25001363) +9386 train 6.858504 (lr=1.8961e-05) (hash(x)=22919889) +9387 train 6.782838 (lr=1.8956e-05) (hash(x)=23225946) +9388 train 6.523758 (lr=1.8951e-05) (hash(x)=23974840) +9389 train 6.563569 (lr=1.8947e-05) (hash(x)=23813266) +9390 train 7.347299 (lr=1.8942e-05) (hash(x)=27923277) +9391 train 6.806215 (lr=1.8937e-05) (hash(x)=26076238) +9392 train 6.624518 (lr=1.8932e-05) (hash(x)=25227985) +9393 train 6.277358 (lr=1.8928e-05) (hash(x)=22490186) +9394 train 6.299217 (lr=1.8923e-05) (hash(x)=21423992) +9395 train 6.278823 (lr=1.8918e-05) (hash(x)=21946864) +9396 train 6.475926 (lr=1.8914e-05) (hash(x)=25685664) +9397 train 6.818645 (lr=1.8909e-05) (hash(x)=30047438) +9398 train 6.421881 (lr=1.8904e-05) (hash(x)=24630755) +9399 train 6.219333 (lr=1.8900e-05) (hash(x)=23513415) +9400 val loss 6.6372 +9400 val perplexity 762.9807 +9400 train 6.390610 (lr=1.8895e-05) (hash(x)=22717447) +9401 train 6.907642 (lr=1.8891e-05) (hash(x)=29122666) +9402 train 6.536884 (lr=1.8886e-05) (hash(x)=25312760) +9403 train 6.468371 (lr=1.8881e-05) (hash(x)=21972630) +9404 train 6.520982 (lr=1.8877e-05) (hash(x)=25310197) +9405 train 6.617230 (lr=1.8872e-05) (hash(x)=26521041) +9406 train 6.010002 (lr=1.8867e-05) (hash(x)=19397688) +9407 train 6.436165 (lr=1.8863e-05) (hash(x)=23641242) +9408 train 6.621994 (lr=1.8858e-05) (hash(x)=27742717) +9409 train 6.324162 (lr=1.8854e-05) (hash(x)=22326293) +9410 train 6.323966 (lr=1.8849e-05) (hash(x)=20690613) +9411 train 6.280341 (lr=1.8845e-05) (hash(x)=22847346) +9412 train 6.127024 (lr=1.8840e-05) (hash(x)=21628392) +9413 train 6.549213 (lr=1.8836e-05) (hash(x)=27075766) +9414 train 7.025485 (lr=1.8831e-05) (hash(x)=31681391) +9415 train 6.775861 (lr=1.8826e-05) (hash(x)=29534561) +9416 train 6.656123 (lr=1.8822e-05) (hash(x)=27206337) +9417 train 6.643620 (lr=1.8817e-05) (hash(x)=24938611) +9418 train 6.419862 (lr=1.8813e-05) (hash(x)=24082156) +9419 train 6.502708 (lr=1.8808e-05) (hash(x)=23786763) +9420 train 6.732459 (lr=1.8804e-05) (hash(x)=25643250) +9421 train 6.726340 (lr=1.8799e-05) (hash(x)=26431267) +9422 train 6.641477 (lr=1.8795e-05) (hash(x)=26047943) +9423 train 6.439041 (lr=1.8791e-05) (hash(x)=19651622) +9424 train 6.426506 (lr=1.8786e-05) (hash(x)=23890631) +9425 train 6.509424 (lr=1.8782e-05) (hash(x)=25764043) +9426 train 6.711315 (lr=1.8777e-05) (hash(x)=26188770) +9427 train 6.905221 (lr=1.8773e-05) (hash(x)=30718836) +9428 train 6.463632 (lr=1.8768e-05) (hash(x)=25261532) +9429 train 6.546318 (lr=1.8764e-05) (hash(x)=24614221) +9430 train 6.722849 (lr=1.8759e-05) (hash(x)=25141158) +9431 train 6.677734 (lr=1.8755e-05) (hash(x)=26304955) +9432 train 6.394115 (lr=1.8751e-05) (hash(x)=24056506) +9433 train 6.587463 (lr=1.8746e-05) (hash(x)=27393349) +9434 train 6.576016 (lr=1.8742e-05) (hash(x)=24555172) +9435 train 6.713863 (lr=1.8738e-05) (hash(x)=26638096) +9436 train 7.002191 (lr=1.8733e-05) (hash(x)=27665368) +9437 train 6.778545 (lr=1.8729e-05) (hash(x)=27095877) +9438 train 6.522243 (lr=1.8724e-05) (hash(x)=25243145) +9439 train 7.067026 (lr=1.8720e-05) (hash(x)=29051604) +9440 train 6.510606 (lr=1.8716e-05) (hash(x)=22699247) +9441 train 6.811018 (lr=1.8711e-05) (hash(x)=26222919) +9442 train 6.154687 (lr=1.8707e-05) (hash(x)=20317938) +9443 train 6.542725 (lr=1.8703e-05) (hash(x)=26482518) +9444 train 6.634126 (lr=1.8699e-05) (hash(x)=26083085) +9445 train 6.503253 (lr=1.8694e-05) (hash(x)=22110278) +9446 train 6.515572 (lr=1.8690e-05) (hash(x)=25686635) +9447 train 6.489946 (lr=1.8686e-05) (hash(x)=25159711) +9448 train 6.213390 (lr=1.8681e-05) (hash(x)=20541765) +9449 train 6.882122 (lr=1.8677e-05) (hash(x)=27774300) +9450 val loss 6.6410 +9450 val perplexity 765.8914 +9450 train 6.618086 (lr=1.8673e-05) (hash(x)=26517169) +9451 train 6.569992 (lr=1.8669e-05) (hash(x)=27894029) +9452 train 6.452257 (lr=1.8664e-05) (hash(x)=24840062) +9453 train 6.377118 (lr=1.8660e-05) (hash(x)=22588789) +9454 train 6.342791 (lr=1.8656e-05) (hash(x)=22256563) +9455 train 6.564316 (lr=1.8652e-05) (hash(x)=26612189) +9456 train 6.499158 (lr=1.8647e-05) (hash(x)=25612290) +9457 train 6.530049 (lr=1.8643e-05) (hash(x)=23008801) +9458 train 6.920828 (lr=1.8639e-05) (hash(x)=29553733) +9459 train 6.706673 (lr=1.8635e-05) (hash(x)=27309306) +9460 train 6.603292 (lr=1.8631e-05) (hash(x)=28990600) +9461 train 6.477286 (lr=1.8627e-05) (hash(x)=23382803) +9462 train 6.878113 (lr=1.8622e-05) (hash(x)=28695249) +9463 train 6.263938 (lr=1.8618e-05) (hash(x)=21236021) +9464 train 6.601195 (lr=1.8614e-05) (hash(x)=26028643) +9465 train 6.375065 (lr=1.8610e-05) (hash(x)=22968681) +9466 train 6.530667 (lr=1.8606e-05) (hash(x)=22548314) +9467 train 6.569372 (lr=1.8602e-05) (hash(x)=26453996) +9468 train 6.499539 (lr=1.8598e-05) (hash(x)=23861291) +9469 train 6.830036 (lr=1.8593e-05) (hash(x)=25223320) +9470 train 6.683069 (lr=1.8589e-05) (hash(x)=23111385) +9471 train 6.743772 (lr=1.8585e-05) (hash(x)=19482110) +9472 train 6.978462 (lr=1.8581e-05) (hash(x)=24297371) +9473 train 6.501048 (lr=1.8577e-05) (hash(x)=24458120) +9474 train 6.615506 (lr=1.8573e-05) (hash(x)=26651694) +9475 train 6.667078 (lr=1.8569e-05) (hash(x)=27366737) +9476 train 6.617906 (lr=1.8565e-05) (hash(x)=22638514) +9477 train 6.655587 (lr=1.8561e-05) (hash(x)=25309421) +9478 train 6.960754 (lr=1.8557e-05) (hash(x)=29637906) +9479 train 6.994152 (lr=1.8553e-05) (hash(x)=28566856) +9480 train 6.303302 (lr=1.8549e-05) (hash(x)=24788847) +9481 train 6.506444 (lr=1.8545e-05) (hash(x)=24065282) +9482 train 6.634612 (lr=1.8541e-05) (hash(x)=25722447) +9483 train 6.879514 (lr=1.8537e-05) (hash(x)=27797472) +9484 train 6.793091 (lr=1.8533e-05) (hash(x)=27500358) +9485 train 6.845570 (lr=1.8529e-05) (hash(x)=27079020) +9486 train 6.819122 (lr=1.8525e-05) (hash(x)=24735909) +9487 train 6.469617 (lr=1.8521e-05) (hash(x)=22327217) +9488 train 6.671524 (lr=1.8517e-05) (hash(x)=26504995) +9489 train 6.486309 (lr=1.8513e-05) (hash(x)=23026175) +9490 train 6.495172 (lr=1.8509e-05) (hash(x)=22983731) +9491 train 6.577156 (lr=1.8505e-05) (hash(x)=23720739) +9492 train 6.804640 (lr=1.8501e-05) (hash(x)=25652438) +9493 train 6.524352 (lr=1.8497e-05) (hash(x)=24655150) +9494 train 6.860717 (lr=1.8493e-05) (hash(x)=21909875) +9495 train 6.783718 (lr=1.8489e-05) (hash(x)=23533293) +9496 train 6.856493 (lr=1.8485e-05) (hash(x)=25706268) +9497 train 6.707851 (lr=1.8481e-05) (hash(x)=25193449) +9498 train 6.622980 (lr=1.8477e-05) (hash(x)=25271486) +9499 train 6.916298 (lr=1.8474e-05) (hash(x)=26937554) +9500 val loss 6.6352 +9500 val perplexity 761.4600 +9500 train 6.973618 (lr=1.8470e-05) (hash(x)=28708931) +9501 train 6.827091 (lr=1.8466e-05) (hash(x)=25175996) +9502 train 6.528572 (lr=1.8462e-05) (hash(x)=23165421) +9503 train 6.549083 (lr=1.8458e-05) (hash(x)=26321048) +9504 train 6.587457 (lr=1.8454e-05) (hash(x)=21028300) +9505 train 6.742400 (lr=1.8450e-05) (hash(x)=24713460) +9506 train 6.473932 (lr=1.8447e-05) (hash(x)=22713785) +9507 train 6.398589 (lr=1.8443e-05) (hash(x)=21567145) +9508 train 6.379945 (lr=1.8439e-05) (hash(x)=22007961) +9509 train 6.591629 (lr=1.8435e-05) (hash(x)=21955317) +9510 train 6.535507 (lr=1.8431e-05) (hash(x)=23158364) +9511 train 6.778941 (lr=1.8428e-05) (hash(x)=24935086) +9512 train 6.549898 (lr=1.8424e-05) (hash(x)=24558460) +9513 train 6.752684 (lr=1.8420e-05) (hash(x)=24960618) +9514 train 6.769213 (lr=1.8416e-05) (hash(x)=28958188) +9515 train 6.418675 (lr=1.8413e-05) (hash(x)=20992234) +9516 train 6.643186 (lr=1.8409e-05) (hash(x)=24037853) +9517 train 6.777767 (lr=1.8405e-05) (hash(x)=27827997) +9518 train 6.445482 (lr=1.8401e-05) (hash(x)=18058118) +9519 train 6.890575 (lr=1.8398e-05) (hash(x)=26245668) +9520 train 6.313808 (lr=1.8394e-05) (hash(x)=20187375) +9521 train 6.343385 (lr=1.8390e-05) (hash(x)=18605235) +9522 train 6.550378 (lr=1.8386e-05) (hash(x)=21541756) +9523 train 6.403615 (lr=1.8383e-05) (hash(x)=23116316) +9524 train 7.119838 (lr=1.8379e-05) (hash(x)=26453023) +9525 train 6.549151 (lr=1.8375e-05) (hash(x)=21486416) +9526 train 6.567028 (lr=1.8372e-05) (hash(x)=23329183) +9527 train 6.575081 (lr=1.8368e-05) (hash(x)=24222780) +9528 train 6.552098 (lr=1.8364e-05) (hash(x)=23721398) +9529 train 6.490364 (lr=1.8361e-05) (hash(x)=22978954) +9530 train 6.684293 (lr=1.8357e-05) (hash(x)=25310958) +9531 train 6.560451 (lr=1.8353e-05) (hash(x)=23764952) +9532 train 6.471448 (lr=1.8350e-05) (hash(x)=22480947) +9533 train 6.808721 (lr=1.8346e-05) (hash(x)=26271374) +9534 train 6.679526 (lr=1.8343e-05) (hash(x)=23308778) +9535 train 6.645955 (lr=1.8339e-05) (hash(x)=22736761) +9536 train 6.615398 (lr=1.8335e-05) (hash(x)=24836962) +9537 train 6.724934 (lr=1.8332e-05) (hash(x)=24314603) +9538 train 6.511977 (lr=1.8328e-05) (hash(x)=23702262) +9539 train 6.814348 (lr=1.8325e-05) (hash(x)=26463399) +9540 train 6.981390 (lr=1.8321e-05) (hash(x)=28866355) +9541 train 6.737869 (lr=1.8317e-05) (hash(x)=27071943) +9542 train 6.833472 (lr=1.8314e-05) (hash(x)=27510738) +9543 train 6.813501 (lr=1.8310e-05) (hash(x)=29885869) +9544 train 6.818653 (lr=1.8307e-05) (hash(x)=23394930) +9545 train 7.018656 (lr=1.8303e-05) (hash(x)=25957755) +9546 train 6.892858 (lr=1.8300e-05) (hash(x)=27121494) +9547 train 6.499014 (lr=1.8296e-05) (hash(x)=24675759) +9548 train 6.552686 (lr=1.8293e-05) (hash(x)=24557566) +9549 train 6.524613 (lr=1.8289e-05) (hash(x)=25057589) +9550 val loss 6.6316 +9550 val perplexity 758.7030 +9550 train 6.795966 (lr=1.8286e-05) (hash(x)=28349095) +9551 train 6.544412 (lr=1.8282e-05) (hash(x)=24701749) +9552 train 6.476583 (lr=1.8279e-05) (hash(x)=23018176) +9553 train 6.519416 (lr=1.8275e-05) (hash(x)=25036725) +9554 train 6.797563 (lr=1.8272e-05) (hash(x)=27496324) +9555 train 6.616818 (lr=1.8268e-05) (hash(x)=25120286) +9556 train 6.408988 (lr=1.8265e-05) (hash(x)=23750303) +9557 train 6.605627 (lr=1.8262e-05) (hash(x)=25829552) +9558 train 6.913907 (lr=1.8258e-05) (hash(x)=27549670) +9559 train 6.878724 (lr=1.8255e-05) (hash(x)=27611501) +9560 train 6.693452 (lr=1.8251e-05) (hash(x)=29650270) +9561 train 6.474484 (lr=1.8248e-05) (hash(x)=28167272) +9562 train 6.506302 (lr=1.8245e-05) (hash(x)=25311136) +9563 train 6.603876 (lr=1.8241e-05) (hash(x)=24943881) +9564 train 6.660891 (lr=1.8238e-05) (hash(x)=24766191) +9565 train 6.676569 (lr=1.8234e-05) (hash(x)=26607112) +9566 train 6.677899 (lr=1.8231e-05) (hash(x)=27998770) +9567 train 6.549809 (lr=1.8228e-05) (hash(x)=23865952) +9568 train 6.392130 (lr=1.8224e-05) (hash(x)=22628795) +9569 train 6.746309 (lr=1.8221e-05) (hash(x)=26457444) +9570 train 7.496500 (lr=1.8218e-05) (hash(x)=31848488) +9571 train 6.873035 (lr=1.8214e-05) (hash(x)=28042679) +9572 train 6.708699 (lr=1.8211e-05) (hash(x)=24203086) +9573 train 6.870916 (lr=1.8208e-05) (hash(x)=26331287) +9574 train 6.815663 (lr=1.8204e-05) (hash(x)=26384130) +9575 train 6.837406 (lr=1.8201e-05) (hash(x)=28592301) +9576 train 6.795073 (lr=1.8198e-05) (hash(x)=25249714) +9577 train 6.482063 (lr=1.8194e-05) (hash(x)=23735941) +9578 train 6.798395 (lr=1.8191e-05) (hash(x)=26558014) +9579 train 6.981979 (lr=1.8188e-05) (hash(x)=26698961) +9580 train 7.018449 (lr=1.8185e-05) (hash(x)=25273228) +9581 train 6.413362 (lr=1.8181e-05) (hash(x)=24993350) +9582 train 6.866115 (lr=1.8178e-05) (hash(x)=27448692) +9583 train 6.709152 (lr=1.8175e-05) (hash(x)=24914468) +9584 train 6.528789 (lr=1.8172e-05) (hash(x)=23659347) +9585 train 6.672948 (lr=1.8168e-05) (hash(x)=27507785) +9586 train 6.540416 (lr=1.8165e-05) (hash(x)=23861508) +9587 train 6.653435 (lr=1.8162e-05) (hash(x)=23370468) +9588 train 6.575575 (lr=1.8159e-05) (hash(x)=23993390) +9589 train 6.543588 (lr=1.8156e-05) (hash(x)=24092258) +9590 train 6.662971 (lr=1.8152e-05) (hash(x)=23943461) +9591 train 6.480010 (lr=1.8149e-05) (hash(x)=24384388) +9592 train 6.760436 (lr=1.8146e-05) (hash(x)=25830546) +9593 train 7.058511 (lr=1.8143e-05) (hash(x)=28711454) +9594 train 6.541890 (lr=1.8140e-05) (hash(x)=25322851) +9595 train 6.618227 (lr=1.8137e-05) (hash(x)=27913989) +9596 train 6.536243 (lr=1.8134e-05) (hash(x)=22319103) +9597 train 6.748787 (lr=1.8130e-05) (hash(x)=25163695) +9598 train 6.560527 (lr=1.8127e-05) (hash(x)=22772099) +9599 train 6.494976 (lr=1.8124e-05) (hash(x)=26315175) +9600 val loss 6.6275 +9600 val perplexity 755.6265 +9600 train 6.798603 (lr=1.8121e-05) (hash(x)=27550675) +9601 train 6.755212 (lr=1.8118e-05) (hash(x)=25508455) +9602 train 6.989453 (lr=1.8115e-05) (hash(x)=25887982) +9603 train 7.192092 (lr=1.8112e-05) (hash(x)=28274242) +9604 train 6.917615 (lr=1.8109e-05) (hash(x)=27856065) +9605 train 6.834986 (lr=1.8106e-05) (hash(x)=28351168) +9606 train 6.735683 (lr=1.8103e-05) (hash(x)=24449905) +9607 train 6.407715 (lr=1.8100e-05) (hash(x)=22918470) +9608 train 6.728075 (lr=1.8097e-05) (hash(x)=24743215) +9609 train 6.717165 (lr=1.8093e-05) (hash(x)=23327707) +9610 train 6.706145 (lr=1.8090e-05) (hash(x)=29576160) +9611 train 6.600067 (lr=1.8087e-05) (hash(x)=23125925) +9612 train 6.171123 (lr=1.8084e-05) (hash(x)=18623602) +9613 train 6.709985 (lr=1.8081e-05) (hash(x)=26735602) +9614 train 6.809079 (lr=1.8078e-05) (hash(x)=26350297) +9615 train 6.777637 (lr=1.8075e-05) (hash(x)=27937309) +9616 train 7.648152 (lr=1.8072e-05) (hash(x)=37412189) +9617 train 6.487126 (lr=1.8069e-05) (hash(x)=22490761) +9618 train 6.658111 (lr=1.8067e-05) (hash(x)=25844945) +9619 train 6.642128 (lr=1.8064e-05) (hash(x)=25195068) +9620 train 6.782279 (lr=1.8061e-05) (hash(x)=26724055) +9621 train 6.545681 (lr=1.8058e-05) (hash(x)=21904722) +9622 train 6.852112 (lr=1.8055e-05) (hash(x)=26981654) +9623 train 6.784061 (lr=1.8052e-05) (hash(x)=27886968) +9624 train 6.590042 (lr=1.8049e-05) (hash(x)=26046354) +9625 train 6.872417 (lr=1.8046e-05) (hash(x)=29433556) +9626 train 6.683673 (lr=1.8043e-05) (hash(x)=22012980) +9627 train 6.614124 (lr=1.8040e-05) (hash(x)=23485347) +9628 train 6.451033 (lr=1.8037e-05) (hash(x)=22123935) +9629 train 6.306006 (lr=1.8034e-05) (hash(x)=22493606) +9630 train 6.905403 (lr=1.8032e-05) (hash(x)=29397261) +9631 train 7.290701 (lr=1.8029e-05) (hash(x)=34599262) +9632 train 6.573567 (lr=1.8026e-05) (hash(x)=25321255) +9633 train 7.167003 (lr=1.8023e-05) (hash(x)=30036062) +9634 train 6.672487 (lr=1.8020e-05) (hash(x)=24364935) +9635 train 6.230239 (lr=1.8017e-05) (hash(x)=20353349) +9636 train 6.545549 (lr=1.8014e-05) (hash(x)=23827923) +9637 train 6.820453 (lr=1.8012e-05) (hash(x)=25760669) +9638 train 6.786849 (lr=1.8009e-05) (hash(x)=26227581) +9639 train 6.794942 (lr=1.8006e-05) (hash(x)=25334969) +9640 train 6.693344 (lr=1.8003e-05) (hash(x)=27750988) +9641 train 6.862511 (lr=1.8000e-05) (hash(x)=27117336) +9642 train 6.804912 (lr=1.7998e-05) (hash(x)=26555836) +9643 train 6.754022 (lr=1.7995e-05) (hash(x)=25699316) +9644 train 7.027779 (lr=1.7992e-05) (hash(x)=25411415) +9645 train 7.090257 (lr=1.7989e-05) (hash(x)=23911830) +9646 train 6.707155 (lr=1.7987e-05) (hash(x)=24813292) +9647 train 6.737587 (lr=1.7984e-05) (hash(x)=24324896) +9648 train 7.174470 (lr=1.7981e-05) (hash(x)=24988546) +9649 train 7.350432 (lr=1.7978e-05) (hash(x)=25360579) +9650 val loss 6.6273 +9650 val perplexity 755.4111 +9650 train 7.059467 (lr=1.7976e-05) (hash(x)=27313790) +9651 train 7.065022 (lr=1.7973e-05) (hash(x)=26929072) +9652 train 6.876623 (lr=1.7970e-05) (hash(x)=25570907) +9653 train 6.682262 (lr=1.7968e-05) (hash(x)=26096902) +9654 train 6.899339 (lr=1.7965e-05) (hash(x)=29824611) +9655 train 6.609900 (lr=1.7962e-05) (hash(x)=26313083) +9656 train 6.879210 (lr=1.7960e-05) (hash(x)=28196014) +9657 train 6.296894 (lr=1.7957e-05) (hash(x)=20152619) +9658 train 6.586798 (lr=1.7954e-05) (hash(x)=23231883) +9659 train 6.718304 (lr=1.7952e-05) (hash(x)=25438870) +9660 train 6.820211 (lr=1.7949e-05) (hash(x)=24751096) +9661 train 6.671391 (lr=1.7946e-05) (hash(x)=25289162) +9662 train 6.602863 (lr=1.7944e-05) (hash(x)=23502755) +9663 train 6.681098 (lr=1.7941e-05) (hash(x)=26055347) +9664 train 6.846771 (lr=1.7938e-05) (hash(x)=25490771) +9665 train 6.620496 (lr=1.7936e-05) (hash(x)=23627679) +9666 train 6.736623 (lr=1.7933e-05) (hash(x)=27363171) +9667 train 6.563251 (lr=1.7931e-05) (hash(x)=24235722) +9668 train 6.625404 (lr=1.7928e-05) (hash(x)=23603021) +9669 train 6.521871 (lr=1.7925e-05) (hash(x)=24876480) +9670 train 6.788293 (lr=1.7923e-05) (hash(x)=26741644) +9671 train 6.292087 (lr=1.7920e-05) (hash(x)=21210095) +9672 train 6.730882 (lr=1.7918e-05) (hash(x)=26197806) +9673 train 6.404602 (lr=1.7915e-05) (hash(x)=22798140) +9674 train 6.825677 (lr=1.7913e-05) (hash(x)=27291808) +9675 train 6.685586 (lr=1.7910e-05) (hash(x)=26018160) +9676 train 6.849890 (lr=1.7908e-05) (hash(x)=25682681) +9677 train 6.700789 (lr=1.7905e-05) (hash(x)=24654150) +9678 train 6.694034 (lr=1.7903e-05) (hash(x)=25031227) +9679 train 6.745415 (lr=1.7900e-05) (hash(x)=25357824) +9680 train 6.503310 (lr=1.7898e-05) (hash(x)=23418379) +9681 train 6.624546 (lr=1.7895e-05) (hash(x)=25346455) +9682 train 6.841268 (lr=1.7893e-05) (hash(x)=25764596) +9683 train 6.539710 (lr=1.7890e-05) (hash(x)=24845093) +9684 train 6.501302 (lr=1.7888e-05) (hash(x)=23625628) +9685 train 6.901855 (lr=1.7885e-05) (hash(x)=27675298) +9686 train 6.704573 (lr=1.7883e-05) (hash(x)=23828308) +9687 train 6.587399 (lr=1.7880e-05) (hash(x)=26632445) +9688 train 6.881157 (lr=1.7878e-05) (hash(x)=29933765) +9689 train 7.017597 (lr=1.7876e-05) (hash(x)=25194529) +9690 train 6.415782 (lr=1.7873e-05) (hash(x)=25565364) +9691 train 6.448279 (lr=1.7871e-05) (hash(x)=23101760) +9692 train 6.700776 (lr=1.7868e-05) (hash(x)=24202905) +9693 train 7.042711 (lr=1.7866e-05) (hash(x)=27950939) +9694 train 6.532596 (lr=1.7864e-05) (hash(x)=26087664) +9695 train 6.617165 (lr=1.7861e-05) (hash(x)=25344330) +9696 train 6.241926 (lr=1.7859e-05) (hash(x)=19844247) +9697 train 6.692228 (lr=1.7857e-05) (hash(x)=25486355) +9698 train 6.476626 (lr=1.7854e-05) (hash(x)=25545972) +9699 train 6.388285 (lr=1.7852e-05) (hash(x)=21521108) +9700 val loss 6.6233 +9700 val perplexity 752.4488 +9700 train 6.576160 (lr=1.7850e-05) (hash(x)=24450546) +9701 train 6.623181 (lr=1.7847e-05) (hash(x)=26944327) +9702 train 6.654329 (lr=1.7845e-05) (hash(x)=22206743) +9703 train 6.613834 (lr=1.7843e-05) (hash(x)=24385783) +9704 train 6.681016 (lr=1.7840e-05) (hash(x)=23798090) +9705 train 6.783237 (lr=1.7838e-05) (hash(x)=23779118) +9706 train 6.725793 (lr=1.7836e-05) (hash(x)=25406777) +9707 train 6.546516 (lr=1.7833e-05) (hash(x)=21789023) +9708 train 6.590432 (lr=1.7831e-05) (hash(x)=23348544) +9709 train 7.000099 (lr=1.7829e-05) (hash(x)=26376972) +9710 train 6.864233 (lr=1.7827e-05) (hash(x)=25895694) +9711 train 6.791059 (lr=1.7824e-05) (hash(x)=26624604) +9712 train 6.534097 (lr=1.7822e-05) (hash(x)=24128122) +9713 train 6.505449 (lr=1.7820e-05) (hash(x)=22943939) +9714 train 6.383578 (lr=1.7818e-05) (hash(x)=20988081) +9715 train 6.721500 (lr=1.7816e-05) (hash(x)=26621084) +9716 train 6.949356 (lr=1.7813e-05) (hash(x)=27925936) +9717 train 6.378376 (lr=1.7811e-05) (hash(x)=22344979) +9718 train 6.316219 (lr=1.7809e-05) (hash(x)=22088865) +9719 train 6.602457 (lr=1.7807e-05) (hash(x)=25046324) +9720 train 6.647167 (lr=1.7805e-05) (hash(x)=25944364) +9721 train 6.650392 (lr=1.7802e-05) (hash(x)=22143304) +9722 train 6.671707 (lr=1.7800e-05) (hash(x)=25402579) +9723 train 6.743122 (lr=1.7798e-05) (hash(x)=24690201) +9724 train 7.458191 (lr=1.7796e-05) (hash(x)=34621549) +9725 train 7.253826 (lr=1.7794e-05) (hash(x)=31493562) +9726 train 7.247913 (lr=1.7792e-05) (hash(x)=30529535) +9727 train 7.208033 (lr=1.7790e-05) (hash(x)=34680076) +9728 train 7.002101 (lr=1.7787e-05) (hash(x)=27882445) +9729 train 7.326796 (lr=1.7785e-05) (hash(x)=31511201) +9730 train 7.239143 (lr=1.7783e-05) (hash(x)=32553865) +9731 train 7.129915 (lr=1.7781e-05) (hash(x)=29510291) +9732 train 7.350110 (lr=1.7779e-05) (hash(x)=32117635) +9733 train 7.456738 (lr=1.7777e-05) (hash(x)=34492741) +9734 train 7.337523 (lr=1.7775e-05) (hash(x)=31166617) +9735 train 6.689580 (lr=1.7773e-05) (hash(x)=26107052) +9736 train 6.773361 (lr=1.7771e-05) (hash(x)=26824538) +9737 train 6.871569 (lr=1.7769e-05) (hash(x)=27554702) +9738 train 6.793041 (lr=1.7767e-05) (hash(x)=25967213) +9739 train 6.652777 (lr=1.7765e-05) (hash(x)=24784210) +9740 train 6.333805 (lr=1.7763e-05) (hash(x)=20345900) +9741 train 6.517246 (lr=1.7761e-05) (hash(x)=23108340) +9742 train 6.779601 (lr=1.7759e-05) (hash(x)=27252649) +9743 train 6.579821 (lr=1.7757e-05) (hash(x)=24137475) +9744 train 6.644639 (lr=1.7755e-05) (hash(x)=23655487) +9745 train 6.459642 (lr=1.7753e-05) (hash(x)=22077480) +9746 train 6.679059 (lr=1.7751e-05) (hash(x)=25469597) +9747 train 6.823856 (lr=1.7749e-05) (hash(x)=27346373) +9748 train 6.499948 (lr=1.7747e-05) (hash(x)=23830979) +9749 train 6.552519 (lr=1.7745e-05) (hash(x)=25068050) +9750 val loss 6.6276 +9750 val perplexity 755.6439 +9750 train 6.629551 (lr=1.7743e-05) (hash(x)=25853134) +9751 train 6.650467 (lr=1.7741e-05) (hash(x)=24653821) +9752 train 6.560411 (lr=1.7739e-05) (hash(x)=23563128) +9753 train 6.584816 (lr=1.7737e-05) (hash(x)=24110242) +9754 train 6.862218 (lr=1.7735e-05) (hash(x)=26385373) +9755 train 6.519277 (lr=1.7733e-05) (hash(x)=21433979) +9756 train 6.627697 (lr=1.7731e-05) (hash(x)=26744771) +9757 train 6.684622 (lr=1.7729e-05) (hash(x)=22251777) +9758 train 6.649547 (lr=1.7728e-05) (hash(x)=25911356) +9759 train 6.876200 (lr=1.7726e-05) (hash(x)=26335191) +9760 train 6.719705 (lr=1.7724e-05) (hash(x)=25236730) +9761 train 6.437563 (lr=1.7722e-05) (hash(x)=22961140) +9762 train 6.730866 (lr=1.7720e-05) (hash(x)=27606402) +9763 train 6.288253 (lr=1.7718e-05) (hash(x)=21415049) +9764 train 6.705127 (lr=1.7716e-05) (hash(x)=24343200) +9765 train 6.904052 (lr=1.7715e-05) (hash(x)=25647138) +9766 train 6.894706 (lr=1.7713e-05) (hash(x)=27022394) +9767 train 6.854208 (lr=1.7711e-05) (hash(x)=27318715) +9768 train 6.437309 (lr=1.7709e-05) (hash(x)=22378861) +9769 train 6.389501 (lr=1.7707e-05) (hash(x)=27014767) +9770 train 6.464531 (lr=1.7706e-05) (hash(x)=25619807) +9771 train 6.607042 (lr=1.7704e-05) (hash(x)=26967264) +9772 train 7.187820 (lr=1.7702e-05) (hash(x)=36233889) +9773 train 7.045088 (lr=1.7700e-05) (hash(x)=32130680) +9774 train 6.622045 (lr=1.7698e-05) (hash(x)=24514124) +9775 train 6.994377 (lr=1.7697e-05) (hash(x)=22779375) +9776 train 7.479234 (lr=1.7695e-05) (hash(x)=28171729) +9777 train 6.397460 (lr=1.7693e-05) (hash(x)=21943332) +9778 train 6.746257 (lr=1.7691e-05) (hash(x)=26445301) +9779 train 7.051172 (lr=1.7690e-05) (hash(x)=29516471) +9780 train 6.864750 (lr=1.7688e-05) (hash(x)=27717580) +9781 train 6.498474 (lr=1.7686e-05) (hash(x)=22236777) +9782 train 6.497322 (lr=1.7685e-05) (hash(x)=24851031) +9783 train 6.877132 (lr=1.7683e-05) (hash(x)=27926071) +9784 train 6.611963 (lr=1.7681e-05) (hash(x)=22264800) +9785 train 6.781676 (lr=1.7680e-05) (hash(x)=26996604) +9786 train 6.516033 (lr=1.7678e-05) (hash(x)=22114203) +9787 train 6.510620 (lr=1.7676e-05) (hash(x)=27403718) +9788 train 6.496858 (lr=1.7675e-05) (hash(x)=22943197) +9789 train 6.688640 (lr=1.7673e-05) (hash(x)=23287371) +9790 train 6.688694 (lr=1.7671e-05) (hash(x)=25900029) +9791 train 6.811934 (lr=1.7670e-05) (hash(x)=29420094) +9792 train 6.552627 (lr=1.7668e-05) (hash(x)=24549382) +9793 train 6.836104 (lr=1.7666e-05) (hash(x)=27609315) +9794 train 6.389493 (lr=1.7665e-05) (hash(x)=22044421) +9795 train 6.771943 (lr=1.7663e-05) (hash(x)=27362231) +9796 train 6.917333 (lr=1.7662e-05) (hash(x)=28504416) +9797 train 6.872102 (lr=1.7660e-05) (hash(x)=29741057) +9798 train 6.476828 (lr=1.7659e-05) (hash(x)=25013871) +9799 train 6.518807 (lr=1.7657e-05) (hash(x)=24724693) +9800 val loss 6.6237 +9800 val perplexity 752.7348 +9800 train 6.753479 (lr=1.7655e-05) (hash(x)=24685053) +9801 train 6.707574 (lr=1.7654e-05) (hash(x)=25588946) +9802 train 6.771350 (lr=1.7652e-05) (hash(x)=25635158) +9803 train 6.658681 (lr=1.7651e-05) (hash(x)=26134002) +9804 train 6.708646 (lr=1.7649e-05) (hash(x)=23405766) +9805 train 6.575427 (lr=1.7648e-05) (hash(x)=21920337) +9806 train 6.293089 (lr=1.7646e-05) (hash(x)=19405829) +9807 train 6.895043 (lr=1.7645e-05) (hash(x)=25530610) +9808 train 6.940145 (lr=1.7643e-05) (hash(x)=29958393) +9809 train 6.979373 (lr=1.7642e-05) (hash(x)=30778880) +9810 train 6.646286 (lr=1.7640e-05) (hash(x)=25702954) +9811 train 6.451168 (lr=1.7639e-05) (hash(x)=22707499) +9812 train 6.433398 (lr=1.7637e-05) (hash(x)=23186442) +9813 train 6.794138 (lr=1.7636e-05) (hash(x)=26191644) +9814 train 6.708197 (lr=1.7634e-05) (hash(x)=25948816) +9815 train 6.855505 (lr=1.7633e-05) (hash(x)=24576066) +9816 train 6.874444 (lr=1.7632e-05) (hash(x)=27457412) +9817 train 6.684479 (lr=1.7630e-05) (hash(x)=25162926) +9818 train 6.826702 (lr=1.7629e-05) (hash(x)=26851142) +9819 train 6.460628 (lr=1.7627e-05) (hash(x)=22984864) +9820 train 6.564542 (lr=1.7626e-05) (hash(x)=21249792) +9821 train 6.619092 (lr=1.7625e-05) (hash(x)=22973380) +9822 train 6.897115 (lr=1.7623e-05) (hash(x)=25300031) +9823 train 6.628147 (lr=1.7622e-05) (hash(x)=24790903) +9824 train 6.798761 (lr=1.7620e-05) (hash(x)=25862946) +9825 train 6.991826 (lr=1.7619e-05) (hash(x)=26290724) +9826 train 6.795081 (lr=1.7618e-05) (hash(x)=25883557) +9827 train 6.534810 (lr=1.7616e-05) (hash(x)=24664220) +9828 train 6.139971 (lr=1.7615e-05) (hash(x)=19166701) +9829 train 6.619659 (lr=1.7614e-05) (hash(x)=24589979) +9830 train 6.534562 (lr=1.7612e-05) (hash(x)=25911823) +9831 train 6.327268 (lr=1.7611e-05) (hash(x)=23458862) +9832 train 6.752789 (lr=1.7610e-05) (hash(x)=25548466) +9833 train 7.024621 (lr=1.7608e-05) (hash(x)=30400028) +9834 train 7.124156 (lr=1.7607e-05) (hash(x)=31206029) +9835 train 6.740859 (lr=1.7606e-05) (hash(x)=27652913) +9836 train 6.779277 (lr=1.7605e-05) (hash(x)=27777136) +9837 train 6.566629 (lr=1.7603e-05) (hash(x)=24316879) +9838 train 6.802760 (lr=1.7602e-05) (hash(x)=24801801) +9839 train 6.969020 (lr=1.7601e-05) (hash(x)=24772439) +9840 train 6.561179 (lr=1.7599e-05) (hash(x)=23829352) +9841 train 6.649835 (lr=1.7598e-05) (hash(x)=24069548) +9842 train 6.807308 (lr=1.7597e-05) (hash(x)=23125968) +9843 train 6.585530 (lr=1.7596e-05) (hash(x)=26262696) +9844 train 6.830000 (lr=1.7595e-05) (hash(x)=27296697) +9845 train 6.877733 (lr=1.7593e-05) (hash(x)=27952317) +9846 train 6.535289 (lr=1.7592e-05) (hash(x)=27038524) +9847 train 6.685058 (lr=1.7591e-05) (hash(x)=24746143) +9848 train 6.434391 (lr=1.7590e-05) (hash(x)=24296550) +9849 train 6.673583 (lr=1.7589e-05) (hash(x)=24492187) +9850 val loss 6.6214 +9850 val perplexity 750.9656 +9850 train 6.670907 (lr=1.7587e-05) (hash(x)=26015762) +9851 train 6.559958 (lr=1.7586e-05) (hash(x)=20511054) +9852 train 6.547571 (lr=1.7585e-05) (hash(x)=20580871) +9853 train 6.623352 (lr=1.7584e-05) (hash(x)=20713568) +9854 train 6.467204 (lr=1.7583e-05) (hash(x)=24203940) +9855 train 6.469763 (lr=1.7582e-05) (hash(x)=24375937) +9856 train 6.246242 (lr=1.7581e-05) (hash(x)=22760185) +9857 train 6.674377 (lr=1.7579e-05) (hash(x)=25113375) +9858 train 6.631579 (lr=1.7578e-05) (hash(x)=24775950) +9859 train 6.808460 (lr=1.7577e-05) (hash(x)=28464631) +9860 train 6.607402 (lr=1.7576e-05) (hash(x)=23890107) +9861 train 6.563800 (lr=1.7575e-05) (hash(x)=22495620) +9862 train 6.496695 (lr=1.7574e-05) (hash(x)=22339587) +9863 train 6.476694 (lr=1.7573e-05) (hash(x)=24488508) +9864 train 6.683815 (lr=1.7572e-05) (hash(x)=25865328) +9865 train 6.679141 (lr=1.7571e-05) (hash(x)=26647302) +9866 train 6.751907 (lr=1.7570e-05) (hash(x)=28142009) +9867 train 6.674211 (lr=1.7569e-05) (hash(x)=24587565) +9868 train 6.839609 (lr=1.7568e-05) (hash(x)=27071939) +9869 train 6.492093 (lr=1.7567e-05) (hash(x)=22935230) +9870 train 6.425191 (lr=1.7566e-05) (hash(x)=23731831) +9871 train 6.988696 (lr=1.7565e-05) (hash(x)=32753768) +9872 train 6.720996 (lr=1.7564e-05) (hash(x)=26599661) +9873 train 6.530798 (lr=1.7563e-05) (hash(x)=24471729) +9874 train 6.770559 (lr=1.7562e-05) (hash(x)=23871697) +9875 train 6.503647 (lr=1.7561e-05) (hash(x)=24132259) +9876 train 6.758611 (lr=1.7560e-05) (hash(x)=23213877) +9877 train 6.698001 (lr=1.7559e-05) (hash(x)=25884855) +9878 train 6.787299 (lr=1.7558e-05) (hash(x)=28879452) +9879 train 6.514466 (lr=1.7557e-05) (hash(x)=23771552) +9880 train 6.624969 (lr=1.7556e-05) (hash(x)=24621461) +9881 train 6.566062 (lr=1.7555e-05) (hash(x)=24391635) +9882 train 6.420064 (lr=1.7554e-05) (hash(x)=21709959) +9883 train 6.749828 (lr=1.7553e-05) (hash(x)=28525125) +9884 train 6.826711 (lr=1.7552e-05) (hash(x)=26112485) +9885 train 6.719436 (lr=1.7551e-05) (hash(x)=29288233) +9886 train 6.964332 (lr=1.7551e-05) (hash(x)=28049729) +9887 train 6.643034 (lr=1.7550e-05) (hash(x)=25921960) +9888 train 6.731618 (lr=1.7549e-05) (hash(x)=24762129) +9889 train 6.676109 (lr=1.7548e-05) (hash(x)=24750726) +9890 train 6.804097 (lr=1.7547e-05) (hash(x)=27364542) +9891 train 6.426523 (lr=1.7546e-05) (hash(x)=23100325) +9892 train 6.728117 (lr=1.7545e-05) (hash(x)=25115516) +9893 train 6.398834 (lr=1.7544e-05) (hash(x)=21912752) +9894 train 6.873877 (lr=1.7544e-05) (hash(x)=25775189) +9895 train 6.770405 (lr=1.7543e-05) (hash(x)=25935286) +9896 train 6.762613 (lr=1.7542e-05) (hash(x)=25765262) +9897 train 6.937081 (lr=1.7541e-05) (hash(x)=25626296) +9898 train 7.495525 (lr=1.7540e-05) (hash(x)=30086285) +9899 train 7.074179 (lr=1.7540e-05) (hash(x)=28217068) +9900 val loss 6.6206 +9900 val perplexity 750.3657 +9900 train 6.591760 (lr=1.7539e-05) (hash(x)=24666478) +9901 train 6.756729 (lr=1.7538e-05) (hash(x)=19718801) +9902 train 6.899304 (lr=1.7537e-05) (hash(x)=20302187) +9903 train 6.837378 (lr=1.7537e-05) (hash(x)=21297332) +9904 train 6.785165 (lr=1.7536e-05) (hash(x)=20251412) +9905 train 6.955602 (lr=1.7535e-05) (hash(x)=26220102) +9906 train 6.490457 (lr=1.7534e-05) (hash(x)=24959359) +9907 train 6.585446 (lr=1.7534e-05) (hash(x)=25231284) +9908 train 6.439789 (lr=1.7533e-05) (hash(x)=21073750) +9909 train 6.717966 (lr=1.7532e-05) (hash(x)=21976453) +9910 train 6.970323 (lr=1.7531e-05) (hash(x)=27532340) +9911 train 6.452223 (lr=1.7531e-05) (hash(x)=23289133) +9912 train 6.813228 (lr=1.7530e-05) (hash(x)=23682137) +9913 train 6.740706 (lr=1.7529e-05) (hash(x)=26094218) +9914 train 6.615112 (lr=1.7529e-05) (hash(x)=24538577) +9915 train 6.503009 (lr=1.7528e-05) (hash(x)=24065141) +9916 train 6.964579 (lr=1.7527e-05) (hash(x)=24032822) +9917 train 6.600816 (lr=1.7527e-05) (hash(x)=24630785) +9918 train 6.787798 (lr=1.7526e-05) (hash(x)=29520891) +9919 train 6.334460 (lr=1.7526e-05) (hash(x)=22772079) +9920 train 6.572235 (lr=1.7525e-05) (hash(x)=25393369) +9921 train 6.508809 (lr=1.7524e-05) (hash(x)=20892794) +9922 train 6.672440 (lr=1.7524e-05) (hash(x)=24121962) +9923 train 6.553819 (lr=1.7523e-05) (hash(x)=17700344) +9924 train 6.654447 (lr=1.7522e-05) (hash(x)=24147940) +9925 train 6.513005 (lr=1.7522e-05) (hash(x)=18375850) +9926 train 6.495038 (lr=1.7521e-05) (hash(x)=16761874) +9927 train 6.734456 (lr=1.7521e-05) (hash(x)=23930354) +9928 train 6.518666 (lr=1.7520e-05) (hash(x)=24371030) +9929 train 6.954237 (lr=1.7520e-05) (hash(x)=26051426) +9930 train 6.876967 (lr=1.7519e-05) (hash(x)=27342765) +9931 train 7.091850 (lr=1.7519e-05) (hash(x)=31777609) +9932 train 6.731048 (lr=1.7518e-05) (hash(x)=26443656) +9933 train 6.530615 (lr=1.7517e-05) (hash(x)=23731877) +9934 train 6.617046 (lr=1.7517e-05) (hash(x)=24164943) +9935 train 6.595483 (lr=1.7516e-05) (hash(x)=24716940) +9936 train 6.658479 (lr=1.7516e-05) (hash(x)=25392810) +9937 train 6.744084 (lr=1.7515e-05) (hash(x)=26867707) +9938 train 6.482147 (lr=1.7515e-05) (hash(x)=21703100) +9939 train 6.541847 (lr=1.7514e-05) (hash(x)=22583493) +9940 train 6.373763 (lr=1.7514e-05) (hash(x)=22800802) +9941 train 6.494759 (lr=1.7514e-05) (hash(x)=22307538) +9942 train 6.484715 (lr=1.7513e-05) (hash(x)=21679939) +9943 train 6.532034 (lr=1.7513e-05) (hash(x)=23069742) +9944 train 6.687399 (lr=1.7512e-05) (hash(x)=25806292) +9945 train 6.752448 (lr=1.7512e-05) (hash(x)=26883443) +9946 train 6.170459 (lr=1.7511e-05) (hash(x)=19607896) +9947 train 6.597703 (lr=1.7511e-05) (hash(x)=24452580) +9948 train 6.445303 (lr=1.7511e-05) (hash(x)=25109914) +9949 train 6.538164 (lr=1.7510e-05) (hash(x)=26095064) +9950 val loss 6.6160 +9950 val perplexity 746.9714 +9950 train 6.682744 (lr=1.7510e-05) (hash(x)=25632214) +9951 train 6.425879 (lr=1.7509e-05) (hash(x)=20707899) +9952 train 6.391460 (lr=1.7509e-05) (hash(x)=22703033) +9953 train 6.774211 (lr=1.7509e-05) (hash(x)=29389932) +9954 train 6.763661 (lr=1.7508e-05) (hash(x)=28620018) +9955 train 6.720230 (lr=1.7508e-05) (hash(x)=25291392) +9956 train 6.684812 (lr=1.7508e-05) (hash(x)=27336189) +9957 train 6.667816 (lr=1.7507e-05) (hash(x)=26594498) +9958 train 6.508184 (lr=1.7507e-05) (hash(x)=23732224) +9959 train 6.598456 (lr=1.7507e-05) (hash(x)=24393903) +9960 train 6.760669 (lr=1.7506e-05) (hash(x)=27226010) +9961 train 6.600742 (lr=1.7506e-05) (hash(x)=24885810) +9962 train 6.661861 (lr=1.7506e-05) (hash(x)=24770685) +9963 train 6.953546 (lr=1.7505e-05) (hash(x)=28354988) +9964 train 6.789593 (lr=1.7505e-05) (hash(x)=24184978) +9965 train 6.441139 (lr=1.7505e-05) (hash(x)=24443616) +9966 train 6.777231 (lr=1.7504e-05) (hash(x)=26136701) +9967 train 6.890470 (lr=1.7504e-05) (hash(x)=27117479) +9968 train 6.527462 (lr=1.7504e-05) (hash(x)=23978418) +9969 train 6.220551 (lr=1.7504e-05) (hash(x)=20094160) +9970 train 7.244711 (lr=1.7503e-05) (hash(x)=29872343) +9971 train 6.498462 (lr=1.7503e-05) (hash(x)=23580999) +9972 train 6.398592 (lr=1.7503e-05) (hash(x)=23897318) +9973 train 6.730612 (lr=1.7503e-05) (hash(x)=28725805) +9974 train 6.636234 (lr=1.7503e-05) (hash(x)=24958270) +9975 train 6.708601 (lr=1.7502e-05) (hash(x)=24301798) +9976 train 6.580379 (lr=1.7502e-05) (hash(x)=24584038) +9977 train 6.815181 (lr=1.7502e-05) (hash(x)=28678215) +9978 train 6.620433 (lr=1.7502e-05) (hash(x)=26565150) +9979 train 6.722952 (lr=1.7502e-05) (hash(x)=25414024) +9980 train 6.600241 (lr=1.7502e-05) (hash(x)=24891322) +9981 train 6.893816 (lr=1.7501e-05) (hash(x)=28925598) +9982 train 6.296970 (lr=1.7501e-05) (hash(x)=20964228) +9983 train 6.645416 (lr=1.7501e-05) (hash(x)=22931350) +9984 train 6.552756 (lr=1.7501e-05) (hash(x)=23346527) +9985 train 6.777167 (lr=1.7501e-05) (hash(x)=27012668) +9986 train 6.481418 (lr=1.7501e-05) (hash(x)=23775772) +9987 train 6.562741 (lr=1.7501e-05) (hash(x)=24584825) +9988 train 6.738826 (lr=1.7501e-05) (hash(x)=25881483) +9989 train 6.589532 (lr=1.7500e-05) (hash(x)=25408780) +9990 train 6.808540 (lr=1.7500e-05) (hash(x)=27075019) +9991 train 6.637045 (lr=1.7500e-05) (hash(x)=25191623) +9992 train 6.869874 (lr=1.7500e-05) (hash(x)=28565631) +9993 train 6.653084 (lr=1.7500e-05) (hash(x)=24025482) +9994 train 6.485544 (lr=1.7500e-05) (hash(x)=20243460) +9995 train 6.683347 (lr=1.7500e-05) (hash(x)=26166513) +9996 train 6.678082 (lr=1.7500e-05) (hash(x)=24816779) +9997 train 6.709316 (lr=1.7500e-05) (hash(x)=23481468) +9998 train 6.440124 (lr=1.7500e-05) (hash(x)=25368164) +9999 val loss 6.6157 +9999 val perplexity 746.7107 +9999 train 6.990719 (lr=1.7500e-05) (hash(x)=30307737) diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/model_02500.pt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/model_02500.pt new file mode 100644 index 0000000000000000000000000000000000000000..05adc377799be32290512f1b9ad1dbf174869f4d --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/model_02500.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4db6fa30dbbb8c2648218f4b72aebf05b842e6e86a099e6e9e8f189ef160f389 +size 38587970 diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/model_05000.pt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/model_05000.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d71cfa49485e731ab2977f3d40a2d66fccfcf47 --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/model_05000.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfad97a57d3a17da622b5256ed0437f0605ce440ce29635de46737dcfc8952bb +size 38587970 diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/model_07500.pt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/model_07500.pt new file mode 100644 index 0000000000000000000000000000000000000000..cff24d59bc4da165408ddac01f5cd84eb348ac79 --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/model_07500.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cef1d9fccd384ca8579ce766ccac8cffc1a000a0bc291ca4d9ce695cc5c7a5d +size 38587970 diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/model_09999.pt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/model_09999.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c9102bd689146c6669a0b390118a290fc0cc670 --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/model_09999.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f74f2bdd1e295e3b28349a3ab741a07f769f2311c4c83bf114363b53e65ebc0 +size 38587970 diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/optimizer_02500.pt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/optimizer_02500.pt new file mode 100644 index 0000000000000000000000000000000000000000..e532ac0cfb1e155fabbe91c39d0c008f339b08fa --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/optimizer_02500.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2bb800e7fd627375a06373c84133e8a8066e722b915d9e635e127ca410306fc +size 70895430 diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/optimizer_05000.pt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/optimizer_05000.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a821156d0835712878c5243c3f4de895897a9df --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/optimizer_05000.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed9f39127bb1239485cb3fc993e33c95452d7cdcbd26843b3e8db62cba57babd +size 70895430 diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/optimizer_07500.pt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/optimizer_07500.pt new file mode 100644 index 0000000000000000000000000000000000000000..da3967aa53e604848eb8125065c1505c7a1ac33a --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/optimizer_07500.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d72628188484e0c8f42d104d1a07f18614432e78855b5be822429865e4b84a5d +size 70895430 diff --git a/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/optimizer_09999.pt b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/optimizer_09999.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c41d2330153cea9f96a375df999077f723ba6b1 --- /dev/null +++ b/lr1.75e-4_total_batch_size5120_seq_len256_decay_lrtrue_attention_kindselective_warmup_steps1/optimizer_09999.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ace8edd6f82273317c7c55731bd5c0d724b215df8e35c3093d21e529d6d576 +size 70895430