diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..28117bd384fafa326be2034e925fd429bf91621e 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,11 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +visualizations/embedding_similarity.png filter=lfs diff=lfs merge=lfs -text +visualizations/embedding_tsne_multilingual.png filter=lfs diff=lfs merge=lfs -text +visualizations/ngram_coverage.png filter=lfs diff=lfs merge=lfs -text +visualizations/performance_dashboard.png filter=lfs diff=lfs merge=lfs -text +visualizations/position_encoding_comparison.png filter=lfs diff=lfs merge=lfs -text +visualizations/tsne_sentences.png filter=lfs diff=lfs merge=lfs -text +visualizations/tsne_words.png filter=lfs diff=lfs merge=lfs -text +visualizations/zipf_law.png filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..ef5cfa0cab4bc3a16780e212469030cb8a77119f --- /dev/null +++ b/README.md @@ -0,0 +1,761 @@ +--- +language: ty +language_name: Tahitian +language_family: austronesian_polynesian +tags: + - wikilangs + - nlp + - tokenizer + - embeddings + - n-gram + - markov + - wikipedia + - feature-extraction + - sentence-similarity + - tokenization + - n-grams + - markov-chain + - text-mining + - fasttext + - babelvec + - vocabulous + - vocabulary + - monolingual + - family-austronesian_polynesian +license: mit +library_name: wikilangs +pipeline_tag: text-generation +datasets: + - omarkamali/wikipedia-monthly +dataset_info: + name: wikipedia-monthly + description: Monthly snapshots of Wikipedia articles across 300+ languages +metrics: + - name: best_compression_ratio + type: compression + value: 3.561 + - name: best_isotropy + type: isotropy + value: 0.0301 + - name: vocabulary_size + type: vocab + value: 0 
+generated: 2026-01-11 +--- + +# Tahitian - Wikilangs Models +## Comprehensive Research Report & Full Ablation Study + +This repository contains NLP models trained and evaluated by Wikilangs, specifically on **Tahitian** Wikipedia data. +We analyze tokenizers, n-gram models, Markov chains, vocabulary statistics, and word embeddings. + +## 📋 Repository Contents + +### Models & Assets + +- Tokenizers (8k, 16k, 32k, 64k) +- N-gram models (2, 3, 4, 5-gram) +- Markov chains (context of 1, 2, 3, 4 and 5) +- Subword N-gram and Markov chains +- Embeddings in various sizes and dimensions (aligned and unaligned) +- Language Vocabulary +- Language Statistics + +![Performance Dashboard](visualizations/performance_dashboard.png) + +### Analysis and Evaluation + +- [1. Tokenizer Evaluation](#1-tokenizer-evaluation) +- [2. N-gram Model Evaluation](#2-n-gram-model-evaluation) +- [3. Markov Chain Evaluation](#3-markov-chain-evaluation) +- [4. Vocabulary Analysis](#4-vocabulary-analysis) +- [5. Word Embeddings Evaluation](#5-word-embeddings-evaluation) +- [6. Morphological Analysis (Experimental)](#6-morphological-analysis-experimental) +- [7. Summary & Recommendations](#7-summary--recommendations) +- [Metrics Glossary](#appendix-metrics-glossary--interpretation-guide) +- [Visualizations Index](#visualizations-index) + +--- +## 1. 
Tokenizer Evaluation + +![Tokenizer Compression](visualizations/tokenizer_compression.png) + +![Tokenizer Fertility](visualizations/tokenizer_fertility.png) + +![Tokenizer OOV](visualizations/tokenizer_oov.png) + +![Total Tokens](visualizations/tokenizer_total_tokens.png) + +### Results + +| Vocab Size | Compression | Avg Token Len | UNK Rate | Total Tokens | +|------------|-------------|---------------|----------|--------------| +| **8k** | 3.455x | 3.48 | 0.1990% | 40,695 | +| **16k** | 3.561x 🏆 | 3.59 | 0.2052% | 39,479 | + +### Tokenization Examples + +Below are sample sentences tokenized with each vocabulary size: + +**Sample 1:** `’O Sant Miquel de Campmajor te hō’ē ’oire iti nō Tatarūnia. mau ’oire iti nō Tat...` + +| Vocab | Tokens | Count | +|-------|--------|-------| +| 8k | `▁’ o ▁sant ▁miquel ▁de ▁camp major ▁te ▁hō ’ ... (+13 more)` | 23 | +| 16k | `▁’ o ▁sant ▁miquel ▁de ▁campmajor ▁te ▁hō ’ ē ... (+12 more)` | 22 | + +**Sample 2:** `Ò Hakahau te òire rahi aè no Ua Pou i Pōrīnetia farāni. ènata` + +| Vocab | Tokens | Count | +|-------|--------|-------| +| 8k | `▁ò ▁hakahau ▁te ▁òire ▁rahi ▁aè ▁no ▁ua ▁pou ▁i ... (+4 more)` | 14 | +| 16k | `▁ò ▁hakahau ▁te ▁òire ▁rahi ▁aè ▁no ▁ua ▁pou ▁i ... (+4 more)` | 14 | + +**Sample 3:** `’O te hō’ē ’oire iti nō Soria. mau ’oire iti nō Soria` + +| Vocab | Tokens | Count | +|-------|--------|-------| +| 8k | `▁’ o ▁te ▁hō ’ ē ▁’ oire ▁iti ▁nō ... (+8 more)` | 18 | +| 16k | `▁’ o ▁te ▁hō ’ ē ▁’ oire ▁iti ▁nō ... (+8 more)` | 18 | + + +### Key Findings + +- **Best Compression:** 16k achieves 3.561x compression +- **Lowest UNK Rate:** 8k with 0.1990% unknown tokens +- **Trade-off:** Larger vocabularies improve compression but increase model size +- **Recommendation:** 16k vocabulary, the larger of the two sizes evaluated here (8k, 16k), gives the best compression (3.561x) with a near-identical UNK rate + +--- +## 2. 
N-gram Model Evaluation + +![N-gram Perplexity](visualizations/ngram_perplexity.png) + +![N-gram Unique](visualizations/ngram_unique.png) + +![N-gram Coverage](visualizations/ngram_coverage.png) + +### Results + +| N-gram | Variant | Perplexity | Entropy | Unique N-grams | Top-100 Coverage | Top-1000 Coverage | +|--------|---------|------------|---------|----------------|------------------|-------------------| +| **2-gram** | Word | 422 | 8.72 | 1,465 | 56.1% | 93.7% | +| **2-gram** | Subword | 157 🏆 | 7.29 | 1,040 | 80.2% | 99.9% | +| **3-gram** | Word | 804 | 9.65 | 2,559 | 47.1% | 82.0% | +| **3-gram** | Subword | 845 | 9.72 | 5,412 | 45.0% | 86.0% | +| **4-gram** | Word | 1,231 | 10.27 | 4,355 | 43.3% | 70.6% | +| **4-gram** | Subword | 2,588 | 11.34 | 15,928 | 29.6% | 67.7% | +| **5-gram** | Word | 874 | 9.77 | 3,200 | 48.9% | 75.5% | +| **5-gram** | Subword | 4,432 | 12.11 | 22,183 | 24.4% | 57.5% | + +### Top 5 N-grams by Size + +**2-grams (Word):** + +| Rank | N-gram | Count | +|------|--------|-------| +| 1 | `i te` | 2,291 | +| 2 | `te mau` | 1,467 | +| 3 | `o te` | 1,091 | +| 4 | `oire iti` | 927 | +| 5 | `iti nō` | 927 | + +**3-grams (Word):** + +| Rank | N-gram | Count | +|------|--------|-------| +| 1 | `oire iti nō` | 927 | +| 2 | `te hō ē` | 509 | +| 3 | `hō ē oire` | 499 | +| 4 | `ē oire iti` | 472 | +| 5 | `mau oire iti` | 455 | + +**4-grams (Word):** + +| Rank | N-gram | Count | +|------|--------|-------| +| 1 | `te hō ē oire` | 499 | +| 2 | `ē oire iti nō` | 472 | +| 3 | `hō ē oire iti` | 472 | +| 4 | `mau oire iti nō` | 455 | +| 5 | `oire iti nō tatarūnia` | 451 | + +**5-grams (Word):** + +| Rank | N-gram | Count | +|------|--------|-------| +| 1 | `te hō ē oire iti` | 472 | +| 2 | `hō ē oire iti nō` | 472 | +| 3 | `o te hō ē oire` | 228 | +| 4 | `mau oire iti nō tatarūnia` | 226 | +| 5 | `tatarūnia mau oire iti nō` | 225 | + +**2-grams (Subword):** + +| Rank | N-gram | Count | +|------|--------|-------| +| 1 | `e _` | 14,698 | +| 2 | `_ t` | 
13,338 | +| 3 | `a _` | 13,137 | +| 4 | `t e` | 10,307 | +| 5 | `i _` | 9,732 | + +**3-grams (Subword):** + +| Rank | N-gram | Count | +|------|--------|-------| +| 1 | `_ t e` | 8,324 | +| 2 | `t e _` | 8,198 | +| 3 | `_ m a` | 4,382 | +| 4 | `_ i _` | 3,923 | +| 5 | `i _ t` | 3,482 | + +**4-grams (Subword):** + +| Rank | N-gram | Count | +|------|--------|-------| +| 1 | `_ t e _` | 7,569 | +| 2 | `i _ t e` | 2,795 | +| 3 | `_ i _ t` | 2,691 | +| 4 | `e _ m a` | 2,393 | +| 5 | `t e _ m` | 2,331 | + +**5-grams (Subword):** + +| Rank | N-gram | Count | +|------|--------|-------| +| 1 | `i _ t e _` | 2,677 | +| 2 | `_ i _ t e` | 2,345 | +| 3 | `t e _ m a` | 2,135 | +| 4 | `_ t e _ m` | 2,091 | +| 5 | `_ m a u _` | 2,082 | + + +### Key Findings + +- **Best Perplexity:** 2-gram (subword) with 157 +- **Entropy Trend:** Increases with larger n-grams on this corpus (subword: 7.29 → 12.11 bits; word: 8.72 → 9.77 bits), i.e. higher orders are less predictable here, likely due to data sparsity +- **Coverage:** Top-1000 patterns cover between 57.5% (5-gram subword) and 99.9% (2-gram subword) of the corpus +- **Recommendation:** 2-gram (subword) for best predictive performance on this corpus; 4-gram and 5-gram models have markedly higher perplexity + +--- +## 3. 
Markov Chain Evaluation + +![Markov Entropy](visualizations/markov_entropy.png) + +![Markov Contexts](visualizations/markov_contexts.png) + +![Markov Branching](visualizations/markov_branching.png) + +### Results + +| Context | Variant | Avg Entropy | Perplexity | Branching Factor | Unique Contexts | Predictability | +|---------|---------|-------------|------------|------------------|-----------------|----------------| +| **1** | Word | 0.5459 | 1.460 | 3.10 | 6,845 | 45.4% | +| **1** | Subword | 1.3451 | 2.541 | 10.23 | 217 | 0.0% | +| **2** | Word | 0.2579 | 1.196 | 1.61 | 21,075 | 74.2% | +| **2** | Subword | 1.0621 | 2.088 | 5.21 | 2,216 | 0.0% | +| **3** | Word | 0.1372 | 1.100 | 1.25 | 33,605 | 86.3% | +| **3** | Subword | 0.7095 | 1.635 | 2.86 | 11,525 | 29.1% | +| **4** | Word | 0.0708 🏆 | 1.050 | 1.11 | 41,713 | 92.9% | +| **4** | Subword | 0.3985 | 1.318 | 1.79 | 32,904 | 60.2% | + +### Generated Text Samples (Word-based) + +Below are text samples generated from each word-based Markov chain model: + +**Context Size 1:** + +1. `te matahiti te reo wiwi me te apooraa ua riro oia ana i te fare haapiiraa` +2. `i ma il sung te repupirita no ghana e te haere oia ei tauturu a era` +3. `e rave a te matahiti ua huru o te purūmu hātua e rave e tae atu` + +**Context Size 2:** + +1. `i te 27 no mē tai ivuaro peretiteni o te taata nei e nina atoa hia o` +2. `te mau mea atoa ta na ïa i rave no te mau tupuna i afa i mai` +3. `o te repūpirita michael sata 23 no tiurai herēni peretiteni o te papori me te aro o` + +**Context Size 3:** + +1. `oire iti nō tatarūnia mau oire iti nō tatarūnia mau oire iti nō soria mau oire iti nō` +2. `te hō ē oire iti nō tatarūnia mau oire iti nō soria mau oire iti nō soria mau` +3. `hō ē oire iti nō tatarūnia mau oire iti nō fenua marite huira atira 681 090 ta ata` + +**Context Size 4:** + +1. `te hō ē oire iti nō soria mau oire iti nō soria mau oire iti nō tatarūnia mau oire` +2. 
`ē oire iti nō soria mau oire iti nō soria mau oire iti nō tatarūnia mau oire iti nō` +3. `hō ē oire iti nō tatarūnia mau oire iti nō tatarūnia mau oire iti nō soria mau oire iti` + + +### Generated Text Samples (Subword-based) + +Below are text samples generated from each subword-based Markov chain model: + +**Context Size 1:** + +1. `_fētitoino_nurât` +2. `a,_tetu_hnafena_` +3. `i_i_nō_tē_no,_oa` + +**Context Size 2:** + +1. `e_te_14_nov._utom` +2. `_te_ia_te_mē_’oia` +3. `a_ra_faapera,_ó_t` + +**Context Size 3:** + +1. `_te_aorené_paraa_f` +2. `te_faata_no_tupu_p` +3. `_mau_fāna_nei_o_tu` + +**Context Size 4:** + +1. `_te_mau_poritita_na` +2. `i_te_repūpirita_mot` +3. `_i_te_di_rave_rapaa` + + +### Key Findings + +- **Best Predictability:** Context-4 (word) with 92.9% predictability +- **Branching Factor:** Decreases with context size (more deterministic) +- **Memory Trade-off:** Larger contexts require more storage (32,904 contexts) +- **Recommendation:** Context-3 or Context-4 for text generation + +--- +## 4. 
Vocabulary Analysis + +![Zipf's Law](visualizations/zipf_law.png) + +![Top Words](visualizations/top20_words.png) + +![Coverage Curve](visualizations/vocab_coverage.png) + +### Statistics + +| Metric | Value | +|--------|-------| +| Vocabulary Size | 2,668 | +| Total Tokens | 62,941 | +| Mean Frequency | 23.59 | +| Median Frequency | 3 | +| Frequency Std Dev | 206.25 | + +### Most Common Words + +| Rank | Word | Frequency | +|------|------|-----------| +| 1 | te | 7,849 | +| 2 | i | 4,463 | +| 3 | e | 2,642 | +| 4 | o | 2,217 | +| 5 | no | 2,165 | +| 6 | mau | 2,091 | +| 7 | a | 1,691 | +| 8 | nō | 1,108 | +| 9 | oire | 1,030 | +| 10 | iti | 946 | + +### Least Common Words (from vocabulary) + +| Rank | Word | Frequency | +|------|------|-----------| +| 1 | antitumor | 2 | +| 2 | mcgill | 2 | +| 3 | polanyi | 2 | +| 4 | stanford | 2 | +| 5 | lehn | 2 | +| 6 | uttar | 2 | +| 7 | pradesh | 2 | +| 8 | papu | 2 | +| 9 | tarutaru | 2 | +| 10 | anavai | 2 | + +### Zipf's Law Analysis + +| Metric | Value | +|--------|-------| +| Zipf Coefficient | 1.1618 | +| R² (Goodness of Fit) | 0.985563 | +| Adherence Quality | **excellent** | + +### Coverage Analysis + +| Top N Words | Coverage | +|-------------|----------| +| Top 100 | 72.0% | +| Top 1,000 | 93.5% | +| Top 5,000 | N/A (vocabulary has only 2,668 words) | +| Top 10,000 | N/A (vocabulary has only 2,668 words) | + +### Key Findings + +- **Zipf Compliance:** R²=0.9856 indicates excellent adherence to Zipf's law +- **High Frequency Dominance:** Top 100 words cover 72.0% of corpus +- **Long Tail:** The 1,668 vocabulary words beyond the top 1,000 account for at most the remaining 6.5% of the corpus + +--- +## 5. 
Word Embeddings Evaluation + +![Embedding Isotropy](visualizations/embedding_isotropy.png) + +![Similarity Matrix](visualizations/embedding_similarity.png) + +![t-SNE Words](visualizations/tsne_words.png) + +![t-SNE Sentences](visualizations/tsne_sentences.png) + + +### 5.1 Cross-Lingual Alignment + +![Alignment Quality](visualizations/embedding_alignment_quality.png) + +![Multilingual t-SNE](visualizations/embedding_tsne_multilingual.png) + + +### 5.2 Model Comparison + +| Model | Dimension | Isotropy | Semantic Density | Alignment R@1 | Alignment R@10 | +|-------|-----------|----------|------------------|---------------|----------------| +| **mono_32d** | 32 | 0.0301 | 0.6381 | N/A | N/A | +| **mono_64d** | 64 | 0.0049 | 0.6224 | N/A | N/A | +| **mono_128d** | 128 | 0.0009 | 0.6655 | N/A | N/A | +| **aligned_32d** | 32 | 0.0301 🏆 | 0.6684 | 0.0028 | 0.0499 | +| **aligned_64d** | 64 | 0.0049 | 0.6410 | 0.0028 | 0.0748 | +| **aligned_128d** | 128 | 0.0009 | 0.6513 | 0.0055 | 0.0914 | + +### Key Findings + +- **Best Isotropy:** aligned_32d with 0.0301 (more uniform distribution) +- **Semantic Density:** Average pairwise similarity of 0.6478. Lower values indicate better semantic separation. +- **Alignment Quality:** Aligned models achieve up to 0.6% R@1 in cross-lingual retrieval. +- **Recommendation:** 128d aligned for best cross-lingual performance + +--- +## 6. Morphological Analysis (Experimental) + +This section presents an automated morphological analysis derived from the statistical divergence between word-level and subword-level models. By analyzing where subword predictability spikes and where word-level coverage fails, we can infer linguistic structures without supervised data. 
+ +### 6.1 Productivity & Complexity + +| Metric | Value | Interpretation | Recommendation | +|--------|-------|----------------|----------------| +| Productivity Index | **5.000** | High morphological productivity | Reliable analysis | +| Idiomaticity Gap | **0.313** | High formulaic/idiomatic content | - | + +### 6.2 Affix Inventory (Productive Units) + +These are the most productive prefixes and suffixes identified by sampling the vocabulary for global substitutability patterns. A unit is considered an affix if stripping it leaves a valid stem that appears in other contexts. + +#### Productive Prefixes +| Prefix | Examples | +|--------|----------| +| `-t` | tau, tauaparauraa, tapearaa | +| `-a` | anuanua, apooraa, agnes | +| `-m` | mori, mesia, mǎta | +| `-p` | pou, piahi, ph | +| `-ta` | tau, tauaparauraa, tapearaa | +| `-ma` | maha, maurice, maoro | +| `-fa` | farii, fakarava, faaoreraa | +| `-pa` | paari, paradisiaca, paturaa | + +#### Productive Suffixes +| Suffix | Examples | +|--------|----------| +| `-a` | fakarava, anuanua, apooraa | +| `-e` | òe, grace, ne | +| `-ia` | mesia, citrifolia, māìtihia | +| `-i` | fifi, farii, mori | +| `-aa` | apooraa, oraraa, itiraa | +| `-ra` | atira, mētera, tera | +| `-na` | ghana, taina, raihana | +| `-ta` | mǎta, poritita, rekoata | + +### 6.3 Bound Stems (Lexical Roots) + +Bound stems are high-frequency subword units that are semantically cohesive but rarely appear as standalone words. These often correspond to the 'core' of a word that requires inflection or derivation to be valid. 
+ +| Stem | Cohesion | Substitutability | Examples | +|------|----------|------------------|----------| +| `anga` | 1.54x | 13 contexts | hangai, whanga, umanga | +| `ahit` | 1.37x | 7 contexts | tahiti, mahiti, tahito | +| `faah` | 1.39x | 6 contexts | faahi, faaho, faahou | +| `tira` | 1.37x | 6 contexts | atira, itiraa, raatira | +| `aama` | 1.36x | 5 contexts | raama, haamau, haamata | +| `haam` | 1.36x | 4 contexts | haamo, haamau, haamou | + +### 6.4 Affix Compatibility (Co-occurrence) + +This table shows which prefixes and suffixes most frequently co-occur on the same stems, revealing the 'stacking' rules of the language's morphology. + +| Prefix | Suffix | Frequency | Examples | +|--------|--------|-----------|----------| +| `-t` | `-a` | 68 words | tauaparauraa, tapearaa | +| `-m` | `-a` | 49 words | mesia, mǎta | +| `-a` | `-a` | 44 words | anuanua, apooraa | +| `-fa` | `-a` | 41 words | fakarava, faaoreraa | +| `-p` | `-a` | 41 words | poritita, paradisiaca | +| `-fa` | `-aa` | 21 words | faaoreraa, faaotiraa | +| `-t` | `-aa` | 19 words | tauaparauraa, tapearaa | +| `-t` | `-ia` | 18 words | torovenia, tureia | +| `-t` | `-i` | 16 words | tauatini, tieti | +| `-p` | `-ia` | 15 words | pipiria, punaauia | + +### 6.5 Recursive Morpheme Segmentation + +Using **Recursive Hierarchical Substitutability**, we decompose complex words into their constituent morphemes. This approach handles nested affixes (e.g., `prefix-prefix-root-suffix`). 
+ +| Word | Suggested Split | Confidence | Stem | +|------|-----------------|------------|------| +| tauaparauraa | **`tauaparaur-a-a`** | 7.5 | `a` | +| faaoreraa | **`faaorer-a-a`** | 7.5 | `a` | +| faaotiraa | **`faaotir-a-a`** | 7.5 | `a` | +| faaohiparaa | **`faaohipar-a-a`** | 7.5 | `a` | +| feruriraa | **`ferurir-a-a`** | 7.5 | `a` | +| faanavairaa | **`faanavair-a-a`** | 7.5 | `a` | +| boraginaceae | **`boraginace-a-e`** | 7.5 | `a` | +| faaûruraa | **`faaûrur-a-a`** | 7.5 | `a` | +| haaparuparu | **`haaparup-a-ru`** | 7.5 | `a` | +| haapiiraa | **`haapiir-a-a`** | 7.5 | `a` | +| faahororaa | **`faahoror-a-a`** | 7.5 | `a` | +| misionare | **`mision-a-re`** | 7.5 | `a` | +| faaineineraa | **`faaineiner-a-a`** | 7.5 | `a` | +| rapaauraa | **`rapaaur-a-a`** | 7.5 | `a` | +| faataaraa | **`faataa-ra-a`** | 7.5 | `ra` | + +### 6.6 Linguistic Interpretation + +> **Automated Insight:** +The language Tahitian shows high morphological productivity. The subword models are significantly more efficient than word models, suggesting a rich system of affixation or compounding. + +> **Note on Idiomaticity:** The high Idiomaticity Gap suggests a large number of frequent multi-word expressions or formulaic sequences that are statistically distinct from their component parts. + +--- +## 7. Summary & Recommendations + +![Performance Dashboard](visualizations/performance_dashboard.png) + +### Production Recommendations + +| Component | Recommended | Rationale | +|-----------|-------------|-----------| +| Tokenizer | **16k BPE** | Best compression (3.56x) | +| N-gram | **2-gram** | Lowest perplexity (157) | +| Markov | **Context-4** | Highest predictability (92.9%) | +| Embeddings | **128d aligned** | Best cross-lingual retrieval (R@1 0.0055, R@10 0.0914) among the evaluated 32d/64d/128d models | + + +--- +## Appendix: Metrics Glossary & Interpretation Guide + +This section provides definitions, intuitions, and guidance for interpreting the metrics used throughout this report. 
+ +### Tokenizer Metrics + +**Compression Ratio** +> *Definition:* The ratio of characters to tokens (chars/token). Measures how efficiently the tokenizer represents text. +> +> *Intuition:* Higher compression means fewer tokens needed to represent the same text, reducing sequence lengths for downstream models. A 3x compression means ~3 characters per token on average. +> +> *What to seek:* Higher is generally better for efficiency, but extremely high compression may indicate overly aggressive merging that loses morphological information. + +**Average Token Length (Fertility)** +> *Definition:* Mean number of characters per token produced by the tokenizer. +> +> *Intuition:* Reflects the granularity of tokenization. Longer tokens capture more context but may struggle with rare words; shorter tokens are more flexible but increase sequence length. +> +> *What to seek:* Balance between 2-5 characters for most languages. Arabic/morphologically-rich languages may benefit from slightly longer tokens. + +**Unknown Token Rate (OOV Rate)** +> *Definition:* Percentage of tokens that map to the unknown/UNK token, indicating words the tokenizer cannot represent. +> +> *Intuition:* Lower OOV means better vocabulary coverage. High OOV indicates the tokenizer encounters many unseen character sequences. +> +> *What to seek:* Below 1% is excellent; below 5% is acceptable. BPE tokenizers typically achieve very low OOV due to subword fallback. + +### N-gram Model Metrics + +**Perplexity** +> *Definition:* Measures how "surprised" the model is by test data. Mathematically: 2^(cross-entropy). Lower values indicate better prediction. +> +> *Intuition:* If perplexity is 100, the model is as uncertain as if choosing uniformly among 100 options at each step. A perplexity of 10 means effectively choosing among 10 equally likely options. +> +> *What to seek:* Lower is better. Perplexity decreases with larger n-grams (more context). Values vary widely by language and corpus size. 
+ +**Entropy** +> *Definition:* Average information content (in bits) needed to encode the next token given the context. Related to perplexity: perplexity = 2^entropy. +> +> *Intuition:* High entropy means high uncertainty/randomness; low entropy means predictable patterns. Natural language typically has entropy between 1-4 bits per character. +> +> *What to seek:* Lower entropy indicates more predictable text patterns. Entropy should decrease as n-gram size increases. + +**Coverage (Top-K)** +> *Definition:* Percentage of corpus occurrences explained by the top K most frequent n-grams. +> +> *Intuition:* High coverage with few patterns indicates repetitive/formulaic text; low coverage suggests diverse vocabulary usage. +> +> *What to seek:* Depends on use case. For language modeling, moderate coverage (40-60% with top-1000) is typical for natural text. + +### Markov Chain Metrics + +**Average Entropy** +> *Definition:* Mean entropy across all contexts, measuring average uncertainty in next-word prediction. +> +> *Intuition:* Lower entropy means the model is more confident about what comes next. Context-1 has high entropy (many possible next words); Context-4 has low entropy (few likely continuations). +> +> *What to seek:* Decreasing entropy with larger context sizes. Very low entropy (<0.1) indicates highly deterministic transitions. + +**Branching Factor** +> *Definition:* Average number of unique next tokens observed for each context. +> +> *Intuition:* High branching = many possible continuations (flexible but uncertain); low branching = few options (predictable but potentially repetitive). +> +> *What to seek:* Branching factor should decrease with context size. Values near 1.0 indicate nearly deterministic chains. + +**Predictability** +> *Definition:* Derived metric: (1 - normalized_entropy) × 100%. Indicates how deterministic the model's predictions are. 
+> +> *Intuition:* 100% predictability means the next word is always certain; 0% means completely random. Real text falls between these extremes. +> +> *What to seek:* Higher predictability for text generation quality, but too high (>98%) may produce repetitive output. + +### Vocabulary & Zipf's Law Metrics + +**Zipf's Coefficient** +> *Definition:* The slope of the log-log plot of word frequency vs. rank. Zipf's law predicts this should be approximately -1. +> +> *Intuition:* A coefficient near -1 indicates the corpus follows natural language patterns where a few words are very common and most words are rare. +> +> *What to seek:* Values between -0.8 and -1.2 indicate healthy natural language distribution. Deviations may suggest domain-specific or artificial text. + +**R² (Coefficient of Determination)** +> *Definition:* Measures how well the linear fit explains the frequency-rank relationship. Ranges from 0 to 1. +> +> *Intuition:* R² near 1.0 means the data closely follows Zipf's law; lower values indicate deviation from expected word frequency patterns. +> +> *What to seek:* R² > 0.95 is excellent; > 0.99 indicates near-perfect Zipf adherence typical of large natural corpora. + +**Vocabulary Coverage** +> *Definition:* Cumulative percentage of corpus tokens accounted for by the top N words. +> +> *Intuition:* Shows how concentrated word usage is. If top-100 words cover 50% of text, the corpus relies heavily on common words. +> +> *What to seek:* Top-100 covering 30-50% is typical. Higher coverage indicates more repetitive text; lower suggests richer vocabulary. + +### Word Embedding Metrics + +**Isotropy** +> *Definition:* Measures how uniformly distributed vectors are in the embedding space. Computed as the ratio of minimum to maximum singular values. +> +> *Intuition:* High isotropy (near 1.0) means vectors spread evenly in all directions; low isotropy means vectors cluster in certain directions, reducing expressiveness. 
+> +> *What to seek:* Higher isotropy generally indicates better-quality embeddings. Values > 0.1 are reasonable; > 0.3 is good. Lower-dimensional embeddings tend to have higher isotropy. + +**Average Norm** +> *Definition:* Mean magnitude (L2 norm) of word vectors in the embedding space. +> +> *Intuition:* Indicates the typical "length" of vectors. Consistent norms suggest stable training; high variance may indicate some words are undertrained. +> +> *What to seek:* Relatively consistent norms across models. The absolute value matters less than consistency (low std deviation). + +**Cosine Similarity** +> *Definition:* Measures angular similarity between vectors, ranging from -1 (opposite) to 1 (identical direction). +> +> *Intuition:* Words with similar meanings should have high cosine similarity. This is the standard metric for semantic relatedness in embeddings. +> +> *What to seek:* Semantically related words should score > 0.5; unrelated words should be near 0. Synonyms often score > 0.7. + +**t-SNE Visualization** +> *Definition:* t-Distributed Stochastic Neighbor Embedding - a dimensionality reduction technique that preserves local structure for visualization. +> +> *Intuition:* Clusters in t-SNE plots indicate groups of semantically related words. Spread indicates vocabulary diversity; tight clusters suggest semantic coherence. +> +> *What to seek:* Meaningful clusters (e.g., numbers together, verbs together). Avoid over-interpreting distances - t-SNE preserves local, not global, structure. + +### General Interpretation Guidelines + +1. **Compare within model families:** Metrics are most meaningful when comparing models of the same type (e.g., 8k vs 64k tokenizer). +2. **Consider trade-offs:** Better performance on one metric often comes at the cost of another (e.g., compression vs. OOV rate). +3. **Context matters:** Optimal values depend on downstream tasks. Text generation may prioritize different metrics than classification. +4. 
**Corpus influence:** All metrics are influenced by corpus characteristics. Wikipedia text differs from social media or literature. +5. **Language-specific patterns:** Morphologically rich languages (like Arabic) may show different optimal ranges than analytic languages. + + +### Visualizations Index + +| Visualization | Description | +|---------------|-------------| +| Tokenizer Compression | Compression ratios by vocabulary size | +| Tokenizer Fertility | Average token length by vocabulary | +| Tokenizer OOV | Unknown token rates | +| Tokenizer Total Tokens | Total tokens by vocabulary | +| N-gram Perplexity | Perplexity by n-gram size | +| N-gram Entropy | Entropy by n-gram size | +| N-gram Coverage | Top pattern coverage | +| N-gram Unique | Unique n-gram counts | +| Markov Entropy | Entropy by context size | +| Markov Branching | Branching factor by context | +| Markov Contexts | Unique context counts | +| Zipf's Law | Frequency-rank distribution with fit | +| Vocab Frequency | Word frequency distribution | +| Top 20 Words | Most frequent words | +| Vocab Coverage | Cumulative coverage curve | +| Embedding Isotropy | Vector space uniformity | +| Embedding Norms | Vector magnitude distribution | +| Embedding Similarity | Word similarity heatmap | +| Nearest Neighbors | Similar words for key terms | +| t-SNE Words | 2D word embedding visualization | +| t-SNE Sentences | 2D sentence embedding visualization | +| Position Encoding | Encoding method comparison | +| Model Sizes | Storage requirements | +| Performance Dashboard | Comprehensive performance overview | + +--- +## About This Project + +### Data Source + +Models trained on [wikipedia-monthly](https://huggingface.co/datasets/omarkamali/wikipedia-monthly) - a monthly snapshot of Wikipedia articles across 300+ languages. + +### Project + +A project by **[Wikilangs](https://wikilangs.org)** - Open-source NLP models for every Wikipedia language. 
+ +### Maintainer + +[Omar Kamali](https://omarkamali.com) - [Omneity Labs](https://omneitylabs.com) + +### Citation + +If you use these models in your research, please cite: + +```bibtex +@misc{wikilangs2025, + author = {Kamali, Omar}, + title = {Wikilangs: Open NLP Models for Wikipedia Languages}, + year = {2025}, + doi = {10.5281/zenodo.18073153}, + publisher = {Zenodo}, + url = {https://huggingface.co/wikilangs}, + institution = {Omneity Labs} +} +``` + +### License + +MIT License - Free for academic and commercial use. + +### Links + +- 🌐 Website: [wikilangs.org](https://wikilangs.org) +- 🤗 Models: [huggingface.co/wikilangs](https://huggingface.co/wikilangs) +- 📊 Data: [wikipedia-monthly](https://huggingface.co/datasets/omarkamali/wikipedia-monthly) +- 👤 Author: [Omar Kamali](https://huggingface.co/omarkamali) +- 🤝 Sponsor: [Featherless AI](https://featherless.ai) +--- +*Generated by Wikilangs Models Pipeline* + +*Report Date: 2026-01-11 02:05:21* diff --git a/models/embeddings/aligned/ty_128d.bin b/models/embeddings/aligned/ty_128d.bin new file mode 100644 index 0000000000000000000000000000000000000000..d39fbc7fecb698bbf95feaa6254322aef22c871b --- /dev/null +++ b/models/embeddings/aligned/ty_128d.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b282a6acc9f7e58cf07234c17083b7a52459e5759569fb22604eb48ceb5aba8f +size 1025020730 diff --git a/models/embeddings/aligned/ty_128d.meta.json b/models/embeddings/aligned/ty_128d.meta.json new file mode 100644 index 0000000000000000000000000000000000000000..bc0b4c114e32de5cffe5ee8d03eaabe4260e738d --- /dev/null +++ b/models/embeddings/aligned/ty_128d.meta.json @@ -0,0 +1 @@ +{"lang": "ty", "dim": 128, "max_seq_len": 512, "is_aligned": true} \ No newline at end of file diff --git a/models/embeddings/aligned/ty_128d.projection.npy b/models/embeddings/aligned/ty_128d.projection.npy new file mode 100644 index 0000000000000000000000000000000000000000..6eda33db53c4d5b091b5b2af13654a6d53e0c12f --- 
/dev/null +++ b/models/embeddings/aligned/ty_128d.projection.npy @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d8a6ef5b01a90530b3fc3537f439c934e3d8903ff7c21430ae900e2271fa61 +size 65664 diff --git a/models/embeddings/aligned/ty_128d_metadata.json b/models/embeddings/aligned/ty_128d_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ff9e14797a48235ab338c3edd575e307e33075e5 --- /dev/null +++ b/models/embeddings/aligned/ty_128d_metadata.json @@ -0,0 +1,8 @@ +{ + "language": "ty", + "dimension": 128, + "version": "aligned", + "hub_language": "en", + "seed_vocab_size": 361, + "vocab_size": 982 +} \ No newline at end of file diff --git a/models/embeddings/aligned/ty_32d.bin b/models/embeddings/aligned/ty_32d.bin new file mode 100644 index 0000000000000000000000000000000000000000..084d6fece1bb57edc4e0c1ed8708f6426c4ea55e --- /dev/null +++ b/models/embeddings/aligned/ty_32d.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83018465ae9390795521c83abbb7126b386c0e67723caedfc782647309efc8ae +size 256266554 diff --git a/models/embeddings/aligned/ty_32d.meta.json b/models/embeddings/aligned/ty_32d.meta.json new file mode 100644 index 0000000000000000000000000000000000000000..4ef93977a15cfd3632217458e9b5da5ce7aee6f1 --- /dev/null +++ b/models/embeddings/aligned/ty_32d.meta.json @@ -0,0 +1 @@ +{"lang": "ty", "dim": 32, "max_seq_len": 512, "is_aligned": true} \ No newline at end of file diff --git a/models/embeddings/aligned/ty_32d.projection.npy b/models/embeddings/aligned/ty_32d.projection.npy new file mode 100644 index 0000000000000000000000000000000000000000..c13253dff21d390b9d5b24842d63a7f488e09884 --- /dev/null +++ b/models/embeddings/aligned/ty_32d.projection.npy @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09acf0053e1caaa31820e1b14b57b171bda931f5fc336afab7ae99c88468daee +size 4224 diff --git a/models/embeddings/aligned/ty_32d_metadata.json 
b/models/embeddings/aligned/ty_32d_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ff155b79231e5cc8cd2bcbe360e233cc73cbe179 --- /dev/null +++ b/models/embeddings/aligned/ty_32d_metadata.json @@ -0,0 +1,8 @@ +{ + "language": "ty", + "dimension": 32, + "version": "aligned", + "hub_language": "en", + "seed_vocab_size": 361, + "vocab_size": 982 +} \ No newline at end of file diff --git a/models/embeddings/aligned/ty_64d.bin b/models/embeddings/aligned/ty_64d.bin new file mode 100644 index 0000000000000000000000000000000000000000..48c8f70de108303bdb8ea69c659f0a0f83fb42ad --- /dev/null +++ b/models/embeddings/aligned/ty_64d.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:516a3619c9bc48aefae7cdac13acc370e680d10352e977d3447211484b1d020e +size 512517946 diff --git a/models/embeddings/aligned/ty_64d.meta.json b/models/embeddings/aligned/ty_64d.meta.json new file mode 100644 index 0000000000000000000000000000000000000000..bd79061d49598df0f886e9cacd458b9d63d5e479 --- /dev/null +++ b/models/embeddings/aligned/ty_64d.meta.json @@ -0,0 +1 @@ +{"lang": "ty", "dim": 64, "max_seq_len": 512, "is_aligned": true} \ No newline at end of file diff --git a/models/embeddings/aligned/ty_64d.projection.npy b/models/embeddings/aligned/ty_64d.projection.npy new file mode 100644 index 0000000000000000000000000000000000000000..7497b9b2aaf177ad0edf0ab3b3d6607222433644 --- /dev/null +++ b/models/embeddings/aligned/ty_64d.projection.npy @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d73fa690c971d6d8609db9a887379b065370e9eb28247b884c160998190e45e5 +size 16512 diff --git a/models/embeddings/aligned/ty_64d_metadata.json b/models/embeddings/aligned/ty_64d_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..28a7ef8a645c374853eb352f062ca0ef60f33256 --- /dev/null +++ b/models/embeddings/aligned/ty_64d_metadata.json @@ -0,0 +1,8 @@ +{ + "language": "ty", + "dimension": 64, + "version": 
"aligned", + "hub_language": "en", + "seed_vocab_size": 361, + "vocab_size": 982 +} \ No newline at end of file diff --git a/models/embeddings/monolingual/ty_128d.bin b/models/embeddings/monolingual/ty_128d.bin new file mode 100644 index 0000000000000000000000000000000000000000..d39fbc7fecb698bbf95feaa6254322aef22c871b --- /dev/null +++ b/models/embeddings/monolingual/ty_128d.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b282a6acc9f7e58cf07234c17083b7a52459e5759569fb22604eb48ceb5aba8f +size 1025020730 diff --git a/models/embeddings/monolingual/ty_128d.meta.json b/models/embeddings/monolingual/ty_128d.meta.json new file mode 100644 index 0000000000000000000000000000000000000000..675d878841b8449a270580ca94a1fdab9026fd8b --- /dev/null +++ b/models/embeddings/monolingual/ty_128d.meta.json @@ -0,0 +1 @@ +{"lang": "ty", "dim": 128, "max_seq_len": 512, "is_aligned": false} \ No newline at end of file diff --git a/models/embeddings/monolingual/ty_128d_metadata.json b/models/embeddings/monolingual/ty_128d_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..dea81fd239dea97062c40af977dd5b7a8ef4d08f --- /dev/null +++ b/models/embeddings/monolingual/ty_128d_metadata.json @@ -0,0 +1,16 @@ +{ + "language": "ty", + "dimension": 128, + "version": "monolingual", + "training_params": { + "algorithm": "skipgram", + "min_count": 5, + "window": 5, + "negative": 5, + "epochs": 5, + "encoding_method": "rope", + "dim": 128, + "threads": 5 + }, + "vocab_size": 982 +} \ No newline at end of file diff --git a/models/embeddings/monolingual/ty_32d.bin b/models/embeddings/monolingual/ty_32d.bin new file mode 100644 index 0000000000000000000000000000000000000000..084d6fece1bb57edc4e0c1ed8708f6426c4ea55e --- /dev/null +++ b/models/embeddings/monolingual/ty_32d.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83018465ae9390795521c83abbb7126b386c0e67723caedfc782647309efc8ae +size 256266554 diff --git 
a/models/embeddings/monolingual/ty_32d.meta.json b/models/embeddings/monolingual/ty_32d.meta.json new file mode 100644 index 0000000000000000000000000000000000000000..457880457f7b535f54b8efb66d76f811036d6099 --- /dev/null +++ b/models/embeddings/monolingual/ty_32d.meta.json @@ -0,0 +1 @@ +{"lang": "ty", "dim": 32, "max_seq_len": 512, "is_aligned": false} \ No newline at end of file diff --git a/models/embeddings/monolingual/ty_32d_metadata.json b/models/embeddings/monolingual/ty_32d_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..a109a7c35bf9e530b79063d3bf3b4fd75d8484bb --- /dev/null +++ b/models/embeddings/monolingual/ty_32d_metadata.json @@ -0,0 +1,16 @@ +{ + "language": "ty", + "dimension": 32, + "version": "monolingual", + "training_params": { + "algorithm": "skipgram", + "min_count": 5, + "window": 5, + "negative": 5, + "epochs": 5, + "encoding_method": "rope", + "dim": 32, + "threads": 5 + }, + "vocab_size": 982 +} \ No newline at end of file diff --git a/models/embeddings/monolingual/ty_64d.bin b/models/embeddings/monolingual/ty_64d.bin new file mode 100644 index 0000000000000000000000000000000000000000..48c8f70de108303bdb8ea69c659f0a0f83fb42ad --- /dev/null +++ b/models/embeddings/monolingual/ty_64d.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:516a3619c9bc48aefae7cdac13acc370e680d10352e977d3447211484b1d020e +size 512517946 diff --git a/models/embeddings/monolingual/ty_64d.meta.json b/models/embeddings/monolingual/ty_64d.meta.json new file mode 100644 index 0000000000000000000000000000000000000000..4d758df4642c320f6ea949b70e71d039849e5050 --- /dev/null +++ b/models/embeddings/monolingual/ty_64d.meta.json @@ -0,0 +1 @@ +{"lang": "ty", "dim": 64, "max_seq_len": 512, "is_aligned": false} \ No newline at end of file diff --git a/models/embeddings/monolingual/ty_64d_metadata.json b/models/embeddings/monolingual/ty_64d_metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..d056ff798e8835b708bb18cb1e0ba539c047b6f0 --- /dev/null +++ b/models/embeddings/monolingual/ty_64d_metadata.json @@ -0,0 +1,16 @@ +{ + "language": "ty", + "dimension": 64, + "version": "monolingual", + "training_params": { + "algorithm": "skipgram", + "min_count": 5, + "window": 5, + "negative": 5, + "epochs": 5, + "encoding_method": "rope", + "dim": 64, + "threads": 5 + }, + "vocab_size": 982 +} \ No newline at end of file diff --git a/models/subword_markov/ty_markov_ctx1_subword.parquet b/models/subword_markov/ty_markov_ctx1_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..1ccbabfaac839a643b811e38ea99647f47acfa5a --- /dev/null +++ b/models/subword_markov/ty_markov_ctx1_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93577288b2d955ab425c0b00ab80e544dfc134106b6455123f81e3d795203ee1 +size 20562 diff --git a/models/subword_markov/ty_markov_ctx1_subword_metadata.json b/models/subword_markov/ty_markov_ctx1_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..beb97eca7c3d188d72654a3370b613a5c81263ef --- /dev/null +++ b/models/subword_markov/ty_markov_ctx1_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 1, + "variant": "subword", + "language": "ty", + "unique_contexts": 217, + "total_transitions": 312100 +} \ No newline at end of file diff --git a/models/subword_markov/ty_markov_ctx2_subword.parquet b/models/subword_markov/ty_markov_ctx2_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..2e6d28dfc232717c1d6a580b6a59c53b736bb669 --- /dev/null +++ b/models/subword_markov/ty_markov_ctx2_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05434986abfedf156dac0710a108c83576d655b545b8846d8fcea728e558a92b +size 87769 diff --git a/models/subword_markov/ty_markov_ctx2_subword_metadata.json 
b/models/subword_markov/ty_markov_ctx2_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..601a9d0c3c3e2f56a61f04658dff890b5513df03 --- /dev/null +++ b/models/subword_markov/ty_markov_ctx2_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 2, + "variant": "subword", + "language": "ty", + "unique_contexts": 2216, + "total_transitions": 310842 +} \ No newline at end of file diff --git a/models/subword_markov/ty_markov_ctx3_subword.parquet b/models/subword_markov/ty_markov_ctx3_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..53c3ccbb4975cac34be391e8d0acc83cc493ee68 --- /dev/null +++ b/models/subword_markov/ty_markov_ctx3_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e24021431ff12a4e9243ce89beda035fd8fc92717592e83811e9a733303fe26a +size 239012 diff --git a/models/subword_markov/ty_markov_ctx3_subword_metadata.json b/models/subword_markov/ty_markov_ctx3_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..467ed6acf42e4f887610336f6fd68370dbcdea1d --- /dev/null +++ b/models/subword_markov/ty_markov_ctx3_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 3, + "variant": "subword", + "language": "ty", + "unique_contexts": 11525, + "total_transitions": 309584 +} \ No newline at end of file diff --git a/models/subword_markov/ty_markov_ctx4_subword.parquet b/models/subword_markov/ty_markov_ctx4_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..bcc881f95657028c0f7a5fb5516f052a7ad2f0b8 --- /dev/null +++ b/models/subword_markov/ty_markov_ctx4_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0510fccb431f59bb958c43301d10276a9c80e192ed8520dbd6bf4217d4ae47d +size 522118 diff --git a/models/subword_markov/ty_markov_ctx4_subword_metadata.json b/models/subword_markov/ty_markov_ctx4_subword_metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..68372a1847433af3ed2f8e7bd89b20334eed7e59 --- /dev/null +++ b/models/subword_markov/ty_markov_ctx4_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 4, + "variant": "subword", + "language": "ty", + "unique_contexts": 32904, + "total_transitions": 308326 +} \ No newline at end of file diff --git a/models/subword_ngram/ty_2gram_subword.parquet b/models/subword_ngram/ty_2gram_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..1dd25105bed3d3b15ef5c321b0be1a8bcbbe89c9 --- /dev/null +++ b/models/subword_ngram/ty_2gram_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1598f0facd04c5225ae517ed2be168a00135d9ed471cfe2c11ac3feb0a4e5a79 +size 14431 diff --git a/models/subword_ngram/ty_2gram_subword_metadata.json b/models/subword_ngram/ty_2gram_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ebea87d58fc40292af4c7c4850e3448fb4fc391d --- /dev/null +++ b/models/subword_ngram/ty_2gram_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 2, + "variant": "subword", + "language": "ty", + "unique_ngrams": 1040, + "total_ngrams": 312100 +} \ No newline at end of file diff --git a/models/subword_ngram/ty_3gram_subword.parquet b/models/subword_ngram/ty_3gram_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..c27705ce32ee04f8ad54a47386a51552583462cf --- /dev/null +++ b/models/subword_ngram/ty_3gram_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:060e0059bf79195688f98e14684fcc6df9c0e6e565a0332c279643e8620ac37a +size 60557 diff --git a/models/subword_ngram/ty_3gram_subword_metadata.json b/models/subword_ngram/ty_3gram_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..28df14e5fd769432712d80cfb77f1772aa7e6856 --- /dev/null +++ b/models/subword_ngram/ty_3gram_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 3, + "variant": 
"subword", + "language": "ty", + "unique_ngrams": 5412, + "total_ngrams": 310842 +} \ No newline at end of file diff --git a/models/subword_ngram/ty_4gram_subword.parquet b/models/subword_ngram/ty_4gram_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..e6d1e4d36df025ef06fbbf0970b8d82cf773fe27 --- /dev/null +++ b/models/subword_ngram/ty_4gram_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76cc5a0dc9099a680b5ef4badb3f90d4f1fb8ee41c8bc9f16f8209103482f39c +size 185694 diff --git a/models/subword_ngram/ty_4gram_subword_metadata.json b/models/subword_ngram/ty_4gram_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ef0947cb45b0d5e41a88fe56ee013074cbd07df1 --- /dev/null +++ b/models/subword_ngram/ty_4gram_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 4, + "variant": "subword", + "language": "ty", + "unique_ngrams": 15928, + "total_ngrams": 309584 +} \ No newline at end of file diff --git a/models/subword_ngram/ty_5gram_subword.parquet b/models/subword_ngram/ty_5gram_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..8cd2a157c4c3599679915f56d2b0aa0497ccf853 --- /dev/null +++ b/models/subword_ngram/ty_5gram_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fa325c5447ab17c25ce729b0a393b0ab2185e6125847bbfab2239a7f97ca1e3 +size 273718 diff --git a/models/subword_ngram/ty_5gram_subword_metadata.json b/models/subword_ngram/ty_5gram_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..a709a90c115781659e6783e8827c43e8a0a630ae --- /dev/null +++ b/models/subword_ngram/ty_5gram_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 5, + "variant": "subword", + "language": "ty", + "unique_ngrams": 22183, + "total_ngrams": 308326 +} \ No newline at end of file diff --git a/models/tokenizer/ty_tokenizer_16k.model b/models/tokenizer/ty_tokenizer_16k.model new file mode 
100644 index 0000000000000000000000000000000000000000..8b47e1a2aebbf58f3f80f6a1319e8fd14f817c7d --- /dev/null +++ b/models/tokenizer/ty_tokenizer_16k.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80c5ee7a62f1139594ba049d18afd8bf5347f7949b1aef1ebdab95ce90a4048b +size 490994 diff --git a/models/tokenizer/ty_tokenizer_16k.vocab b/models/tokenizer/ty_tokenizer_16k.vocab new file mode 100644 index 0000000000000000000000000000000000000000..669531c73f94a065e4f905360c70cd4484a35440 --- /dev/null +++ b/models/tokenizer/ty_tokenizer_16k.vocab @@ -0,0 +1,16000 @@ + 0 + 0 + 0 + 0 +▁t -0 +▁te -1 +▁m -2 +▁i -3 +ra -4 +▁n -5 +▁ma -6 +re -7 +ti -8 +▁f -9 +▁p -10 +▁h -11 +ta -12 +ia -13 +▁ta -14 +▁’ -15 +▁mau -16 +▁e -17 +ua -18 +▁no -19 +▁o -20 +▁a -21 +na -22 +hi -23 +ire -24 +▁fa -25 +▁nō -26 +raa -27 +ot -28 +oire -29 +▁iti -30 +te -31 +or -32 +ne -33 +▁s -34 +en -35 +▁ha -36 +ri -37 +ni -38 +otu -39 +▁pa -40 +▁mā -41 +▁ò -42 +ro -43 +▁ra -44 +▁mata -45 +ha -46 +▁hō -47 +nia -48 +va -49 +▁ua -50 +enua -51 +rū -52 +▁fenua -53 +▁tata -54 +motu -55 +rūnia -56 +▁tatarūnia -57 +▁tu -58 +ma -59 +pa -60 +▁r -61 +hiti -62 +▁taa -63 +he -64 +oria -65 +iraa -66 +▁d -67 +▁soria -68 +▁faa -69 +hia -70 +▁b -71 +to -72 +▁k -73 +▁matahiti -74 +la -75 +tia -76 +▁po -77 +rā -78 +pi -79 +rāni -80 +▁farāni -81 +▁( -82 +▁na -83 +rau -84 +▁haa -85 +▁to -86 +tere -87 +▁c -88 +ura -89 +▁mai -90 +▁parau -91 +ka -92 +▁pō -93 +le -94 +rī -95 +▁re -96 +▁ti -97 +tu -98 +netia -99 +▁g -100 +ere -101 +▁taamotu -102 +▁ho -103 +li -104 +▁oia -105 +▁pōrī -106 +▁pōrīnetia -107 +▁haapi -108 +▁fare -109 +ur -110 +▁me -111 +āna -112 +ho -113 +oto -114 +ara -115 +▁pohe -116 +▁fāna -117 +er -118 +ng -119 +vi -120 +▁motu -121 +▁pohera -122 +▁fānaura -123 +po -124 +āmotu -125 +▁tene -126 +▁haapiiraa -127 +▁tuāmotu -128 +▁tenetere -129 +pu -130 +▁roto -131 +ve -132 +▁de -133 +▁pu -134 +au -135 +os -136 +▁mo -137 +▁ni -138 +▁tua -139 +si -140 +▁rahi -141 +ui -142 +tihia -143 +▁ia -144 
+▁va -145 +▁ei -146 +ea -147 +ei -148 +tor -149 +haa -150 +ìtihia -151 +hana -152 +lo -153 +▁taata -154 +▁māìtihia -155 +an -156 +▁òire -157 +▁u -158 +▁hoê -159 +oraa -160 +▁w -161 +▁ri -162 +es -163 +us -164 +▁òna -165 +▁tā -166 +▁hau -167 +▁pae -168 +▁tuhaa -169 +ie -170 +toru -171 +iti -172 +▁ro -173 +▁tuatoru -174 +on -175 +are -176 +tua -177 +fi -178 +), -179 +hipa -180 +▁j -181 +me -182 +tira -183 +urg -184 +rii -185 +ru -186 +▁- -187 +▁l -188 +oro -189 +▁â -190 +▁burg -191 +▁pere -192 +no -193 +▁burgos -194 +ca -195 +▁vi -196 +▁ghana -197 +mi -198 +▁hi -199 +▁hu -200 +da -201 +ga -202 +▁nei -203 +▁rā -204 +pe -205 +▁rave -206 +ata -207 +▁por -208 +▁. -209 +▁' -210 +▁riro -211 +▁ohipa -212 +is -213 +ite -214 +▁fē -215 +▁pā -216 +▁reo -217 +▁puna -218 +nd -219 +eae -220 +ira -221 +ceae -222 +hine -223 +▁fēti -224 +el -225 +▁pū -226 +▁ca -227 +▁atu -228 +fa -229 +▁la -230 +▁tama -231 +pooraa -232 +▁faatere -233 +nga -234 +▁ato -235 +▁ora -236 +mo -237 +nu -238 +uri -239 +uru -240 +areva -241 +ba -242 +▁huiraa -243 +▁huiraatira -244 +ote -245 +▁ka -246 +teni -247 +se -248 +▁è -249 +▁sa -250 +itita -251 +▁poritita -252 +mu -253 +▁ai -254 +titeni -255 +▁v -256 +les -257 +▁tei -258 +hu -259 +ora -260 +tou -261 +▁ara -262 +▁raro -263 +ku -264 +▁: -265 +▁tià -266 +oa -267 +fic -268 +tai -269 +▁tahiti -270 +▁mari -271 +▁reira -272 +▁haere -273 +▁" -274 +mua -275 +▁roa -276 +▁tau -277 +ki -278 +ria -279 +rahi -280 +▁peretiteni -281 +tea -282 +▁fe -283 +▁of -284 +rama -285 +▁taote -286 +wa -287 +ya -288 +òhi -289 +▁ki -290 +▁mi -291 +▁san -292 +▁māòhi -293 +ce -294 +de -295 +naa -296 +▁af -297 +▁tae -298 +▁rapa -299 +qu -300 +▁mea -301 +▁âpooraa -302 +ol -303 +▁pupu -304 +▁maareva -305 +▁au -306 +▁pe -307 +▁pi -308 +araa -309 +▁tahi -310 +▁marite -311 +sa -312 +ore -313 +uhia -314 +▁muri -315 +▁reva -316 +▁iho -317 +ficie -318 +▁atoa -319 +▁pārahi -320 +ll -321 +tā -322 +uka -323 +▁vahine -324 +). 
-325 +di -326 +▁matamua -327 +eu -328 +▁rē -329 +▁afri -330 +▁nati -331 +do -332 +sz -333 +▁ko -334 +▁nga -335 +ch -336 +co -337 +▁nu -338 +▁hui -339 +▁farii -340 +▁haapii -341 +▁maitai -342 +ko -343 +um -344 +sia -345 +ter -346 +▁mou -347 +▁raa -348 +▁buka -349 +▁rēni -350 +ci -351 +▁ne -352 +▁so -353 +▁wha -354 +miraa -355 +▁papa -356 +▁tamarii -357 +ny -358 +ran -359 +▁ite -360 +▁teie -361 +faa -362 +per -363 +auraa -364 +▁mana -365 +▁haama -366 +ke -367 +st -368 +ana -369 +▁an -370 +▁in -371 +▁le -372 +den -373 +men -374 +▁ba -375 +euro -376 +▁maimiraa -377 +▁rapaauraa -378 +il -379 +▁‘ -380 +era -381 +▁am -382 +▁horo -383 +▁sant -384 +europa -385 +▁afrika -386 +in -387 +▁li -388 +▁râ -389 +atira -390 +▁fana -391 +▁y -392 +nei -393 +roa -394 +▁co -395 +▁he -396 +▁su -397 +▁mouà -398 +▁faana -399 +▁huira -400 +▁ku -401 +▁nā -402 +mani -403 +hō -404 +ss -405 +▁à -406 +▁ʻ -407 +pua -408 +▁ao -409 +tion -410 +▁noa -411 +▁tai -412 +▁vai -413 +siden -414 +▁metua -415 +▁ratou -416 +▁oraraa -417 +hōê -418 +sti -419 +▁lo -420 +nata -421 +tahi -422 +tita -423 +vini -424 +▁fau -425 +▁ken -426 +hōêraa -427 +▁tāhōêraa -428 +du -429 +go -430 +ts -431 +ça -432 +net -433 +āta -434 +▁wa -435 +▁apa -436 +▁mar -437 +▁fran -438 +▁tāne -439 +bi -440 +th -441 +lia -442 +lla -443 +lle -444 +que -445 +▁di -446 +▁km -447 +▁èn -448 +tepa -449 +▁amui -450 +▁atua -451 +▁huru -452 +▁noho -453 +▁poli -454 +▁whaka -455 +▁ènāta -456 +tī -457 +▁al -458 +▁da -459 +▁se -460 +▁melo -461 +▁piti -462 +▁site -463 +▁taua -464 +▁mesia -465 +▁moana -466 +▁rahiraa -467 +am -468 +gi -469 +né -470 +ito -471 +pea -472 +toa -473 +▁ac -474 +▁ve -475 +▁ana -476 +▁oro -477 +▁the -478 +▁para -479 +▁mahana -480 +perficie -481 +▁faanaho -482 +▁politita -483 +ly -484 +ou -485 +ari -486 +sie -487 +▁() -488 +vihi -489 +▁feia -490 +▁here -491 +▁pape -492 +▁apooraa -493 +▁aravihi -494 +▁peresiden -495 +▁superficie -496 +gh -497 +lu -498 +rd -499 +▁) -500 +che -501 +hau -502 +ipo -503 +ris -504 +rua -505 +tre -506 
+mona -507 +oromona -508 +▁marama -509 +▁peresideni -510 +ge -511 +▁• -512 +ord -513 +tif -514 +▁(, -515 +▁be -516 +iete -517 +tiraa -518 +▁vahi -519 +▁vila -520 +▁ènata -521 +▁faufaa -522 +ck -523 +gu -524 +ye -525 +▁z -526 +▁ô -527 +▁do -528 +▁ga -529 +▁ru -530 +pura -531 +uraa -532 +▁ani -533 +▁ter -534 +nette -535 +▁faaho -536 +▁officie -537 +▁fanauhia -538 +ai -539 +ns -540 +nt -541 +▁; -542 +ngi -543 +ola -544 +roo -545 +áre -546 +▁ap -547 +▁aè -548 +rita -549 +▁hoa -550 +metua -551 +▁tere -552 +▁tumu -553 +▁faaite -554 +▁moromona -555 +▁officiel -556 +▁faanahoraa -557 +pō -558 +ré -559 +ïa -560 +▁« -561 +▁ê -562 +▁ā -563 +ber -564 +car -565 +ete -566 +ohi -567 +oni -568 +ton -569 +▁jo -570 +tara -571 +▁tao -572 +▁vig -573 +▁poly -574 +ororaa -575 +▁apato -576 +▁faahi -577 +▁tatou -578 +▁oraora -579 +▁tuamotu -580 +▁vignette -581 +ph -582 +cia -583 +gra -584 +rus -585 +ász -586 +▁fi -587 +▁ja -588 +▁lu -589 +▁tō -590 +çais -591 +▁kuf -592 +▁tor -593 +▁manu -594 +▁tupu -595 +▁faatereraa -596 +.. 
-597 +mb -598 +pû -599 +sc -600 +za -601 +▁ù -602 +ihi -603 +man -604 +tal -605 +▁go -606 +▁mu -607 +▁tē -608 +▁ïa -609 +ahia -610 +pere -611 +poto -612 +tera -613 +▁ava -614 +▁eka -615 +▁kwa -616 +▁nui -617 +▁tia -618 +einaa -619 +lesia -620 +▁aita -621 +▁faah -622 +▁hiva -623 +▁piha -624 +▁tara -625 +▁tavini -626 +▁ekalesia -627 +▁français -628 +▁mataeinaa -629 +__ -630 +ao -631 +so -632 +hua -633 +ose -634 +pha -635 +ver -636 +▁ab -637 +▁et -638 +fare -639 +hene -640 +mala -641 +ment -642 +▁and -643 +▁des -644 +▁nia -645 +▁rus -646 +amotu -647 +nésie -648 +rīihi -649 +▁faao -650 +▁faata -651 +▁paari -652 +▁rotopu -653 +▁parīihi -654 +▁fānauhia -655 +▁heremani -656 +▁orometua -657 +be -658 +mp -659 +ama -660 +cra -661 +esu -662 +nes -663 +ori -664 +phe -665 +pia -666 +qui -667 +uor -668 +▁ar -669 +▁du -670 +rana -671 +turu -672 +▁hua -673 +▁pua -674 +▁upo -675 +puare -676 +▁iesu -677 +▁otea -678 +▁pāti -679 +▁utua -680 +taiete -681 +▁nunaa -682 +▁kufuor -683 +▁tapura -684 +▁tetepa -685 +▁fepuare -686 +▁oteania -687 +▁utuafare -688 +▁polynésie -689 +fo -690 +hn -691 +ká -692 +rs -693 +dia -694 +paì -695 +ren -696 +reo -697 +res -698 +sen -699 +▁bi -700 +▁os -701 +▁rê -702 +itei -703 +▁apî -704 +▁ari -705 +▁bra -706 +▁com -707 +▁den -708 +▁eva -709 +▁hiv -710 +▁les -711 +▁par -712 +▁pro -713 +▁arii -714 +▁atoà -715 +▁mahi -716 +▁mili -717 +▁niho -718 +▁oire -719 +▁repu -720 +▁upoo -721 +naceae -722 +▁accra -723 +▁kenya -724 +▁maria -725 +▁tahaa -726 +▁faaroo -727 +▁tahito -728 +▁teitei -729 +▁animala -730 +▁haereere -731 +▁tamahine -732 +▁maramarama -733 +je -734 +ld -735 +ry -736 +té -737 +vo -738 +ger -739 +nge -740 +nui -741 +tri -742 +usa -743 +▁ci -744 +▁en -745 +▁ju -746 +▁si -747 +orea -748 +tura -749 +ātia -750 +ndola -751 +▁aore -752 +▁nuku -753 +▁raua -754 +▁tane -755 +▁tera -756 +▁tooa -757 +henehe -758 +▁kwagh -759 +▁tahua -760 +▁nehenehe -761 +▁française -762 +▁faahororaa -763 +ja -764 +pǔ -765 +ul -766 +ão -767 +▁с -768 +bia -769 +can -770 +chi -771 
+ita -772 +los -773 +ndi -774 +nua -775 +rit -776 +unu -777 +▁as -778 +▁ge -779 +▁lá -780 +▁mē -781 +▁tī -782 +ihia -783 +nana -784 +piti -785 +tāne -786 +vema -787 +▁cha -788 +▁fer -789 +▁gra -790 +▁maa -791 +▁mua -792 +▁raì -793 +▁tea -794 +nelia -795 +▁faaa -796 +▁fara -797 +▁fatu -798 +▁hiro -799 +▁john -800 +▁maha -801 +▁mala -802 +▁papû -803 +▁tema -804 +▁ture -805 +itihia -806 +perera -807 +▁faatu -808 +▁haapa -809 +▁varua -810 +▁pōrana -811 +▁tāvini -812 +▁evanelia -813 +ls -814 +pū -815 +▁* -816 +aro -817 +bli -818 +ina -819 +iva -820 +ona -821 +tes -822 +tro -823 +utu -824 +ven -825 +▁hā -826 +▁rū -827 +ston -828 +tifā -829 +▁ali -830 +▁ere -831 +▁hoi -832 +▁hou -833 +▁ihi -834 +▁pau -835 +atere -836 +ngata -837 +rophe -838 +▁iose -839 +▁puka -840 +▁puta -841 +▁tapu -842 +▁toro -843 +ipoipo -844 +pearaa -845 +pirita -846 +▁pāpaì -847 +▁tiunu -848 +▁haamau -849 +▁novema -850 +aterehau -851 +▁haamata -852 +▁iosepha -853 +▁milioni -854 +▁tauturu -855 +▁pātitifā -856 +▁sotaiete -857 +▁faaipoipo -858 +▁repupirita -859 +bu -860 +cs -861 +ct -862 +ky -863 +nk -864 +tr -865 +tō -866 +ze -867 +▁? 
-868 +ell -869 +iri -870 +mfi -871 +mon -872 +phi -873 +ste -874 +tin -875 +tta -876 +vai -877 +ǔpǔ -878 +▁em -879 +▁gr -880 +▁ny -881 +▁or -882 +▁tm -883 +ctor -884 +dade -885 +erau -886 +here -887 +puka -888 +pōrū -889 +rava -890 +sier -891 +tete -892 +▁adu -893 +▁are -894 +▁boa -895 +▁chi -896 +▁con -897 +▁cse -898 +▁mal -899 +▁pou -900 +▁pre -901 +▁pré -902 +▁sta -903 +▁tel -904 +▁utu -905 +faaho -906 +ndica -907 +stitu -908 +▁anaa -909 +▁auta -910 +▁mate -911 +▁moni -912 +▁pǔpǔ -913 +▁raau -914 +▁rima -915 +▁taho -916 +▁tini -917 +▁tino -918 +▁offic -919 +▁osier -920 +▁rūtia -921 +▁taime -922 +▁ùpōrū -923 +ropheta -924 +▁gaston -925 +▁indica -926 +▁faatupu -927 +▁huahine -928 +▁malaria -929 +▁tupuraa -930 +▁peropheta -931 +nc -932 +op -933 +ty -934 +tá -935 +иј -936 +▁, -937 +amu -938 +dre -939 +ian -940 +ley -941 +lin -942 +mpa -943 +opo -944 +rei -945 +▁bo -946 +▁cu -947 +▁hī -948 +▁ii -949 +▁is -950 +▁ke -951 +▁lā -952 +▁vo -953 +▁wi -954 +ford -955 +iata -956 +itai -957 +manu -958 +masi -959 +mene -960 +mite -961 +ogra -962 +olia -963 +poku -964 +ques -965 +reva -966 +tema -967 +vana -968 +▁ale -969 +▁aro -970 +▁aru -971 +▁grâ -972 +▁hen -973 +▁jac -974 +▁kai -975 +▁mei -976 +▁mer -977 +▁one -978 +▁sel -979 +niora -980 +parau -981 +yamfi -982 +▁bela -983 +▁faaà -984 +▁hiti -985 +▁mani -986 +▁toru -987 +▁ware -988 +faahou -989 +firita -990 +riiraa -991 +▁hopea -992 +▁opoku -993 +▁òhipa -994 +▁hamani -995 +▁kumasi -996 +▁institu -997 +▁papeete -998 +▁tahoera -999 +▁terepia -1000 +▁faaohipa -1001 +▁grândola -1002 +". -1003 +.: -1004 +dy -1005 +fe -1006 +hā -1007 +má -1008 +sh -1009 +sá -1010 +рб -1011 +▁+ -1012 +▁[ -1013 +▁x -1014 +▁» -1015 +▁é -1016 +... 
-1017 +___ -1018 +est -1019 +gas -1020 +gen -1021 +han -1022 +kye -1023 +moa -1024 +nda -1025 +num -1026 +ort -1027 +osa -1028 +phy -1029 +rea -1030 +rum -1031 +sis -1032 +son -1033 +sta -1034 +▁il -1035 +▁je -1036 +▁ox -1037 +▁ph -1038 +dona -1039 +enei -1040 +land -1041 +line -1042 +pora -1043 +rika -1044 +riti -1045 +tava -1046 +toro -1047 +рбиј -1048 +▁___ -1049 +▁ada -1050 +▁ahu -1051 +▁bro -1052 +▁dis -1053 +▁esc -1054 +▁hei -1055 +▁hia -1056 +▁jea -1057 +▁mon -1058 +▁niu -1059 +▁pla -1060 +▁sha -1061 +▁ven -1062 +ivava -1063 +▁cseb -1064 +▁hoho -1065 +▁juli -1066 +▁mada -1067 +▁make -1068 +▁musa -1069 +▁māti -1070 +▁nana -1071 +▁peri -1072 +▁popa -1073 +▁taia -1074 +▁taka -1075 +gyamfi -1076 +ngatau -1077 +▁boadu -1078 +▁maoro -1079 +▁rusia -1080 +▁santa -1081 +▁selva -1082 +▁србиј -1083 +biaceae -1084 +āfirita -1085 +▁faaora -1086 +▁tinitō -1087 +▁tomite -1088 +▁upooti -1089 +▁belarus -1090 +▁paniora -1091 +▁raapoto -1092 +▁tuahine -1093 +▁fangatau -1094 +▁fariiraa -1095 +., -1096 +hī -1097 +ix -1098 +lá -1099 +nē -1100 +oà -1101 +▁/ -1102 +ano -1103 +api -1104 +atu -1105 +bal -1106 +cha -1107 +chy -1108 +cum -1109 +des -1110 +dio -1111 +dor -1112 +emp -1113 +ial -1114 +iao -1115 +kij -1116 +lei -1117 +lor -1118 +mei -1119 +nas -1120 +ngo -1121 +nha -1122 +nsk -1123 +our -1124 +qua -1125 +shi -1126 +siw -1127 +tau -1128 +tte -1129 +uma -1130 +zil -1131 +āni -1132 +▁ed -1133 +▁eu -1134 +▁ly -1135 +▁st -1136 +▁sz -1137 +▁tw -1138 +▁tū -1139 +▁vī -1140 +bera -1141 +doua -1142 +ella -1143 +esse -1144 +huru -1145 +ingi -1146 +jata -1147 +lles -1148 +mita -1149 +nati -1150 +orle -1151 +pera -1152 +pōnē -1153 +ream -1154 +resa -1155 +rica -1156 +sité -1157 +tero -1158 +tini -1159 +topa -1160 +tori -1161 +èraa -1162 +ātea -1163 +▁aha -1164 +▁ame -1165 +▁ano -1166 +▁bla -1167 +▁can -1168 +▁del -1169 +▁fra -1170 +▁mba -1171 +▁oli -1172 +▁que -1173 +▁sur -1174 +▁tui -1175 +▁uni -1176 +▁vau -1177 +▁vie -1178 +▁âva -1179 +losse -1180 +nuare -1181 +reraa -1182 +ritch 
-1183 +tanga -1184 +teria -1185 +tāmua -1186 +ōhipa -1187 +▁cast -1188 +▁faka -1189 +▁goka -1190 +▁hana -1191 +▁jean -1192 +▁link -1193 +▁mono -1194 +▁mora -1195 +▁patu -1196 +▁pora -1197 +▁sang -1198 +▁taha -1199 +▁tahu -1200 +▁tapo -1201 +▁tuni -1202 +douard -1203 +taceae -1204 +vairaa -1205 +▁atepa -1206 +▁atopa -1207 +▁hitia -1208 +▁korle -1209 +▁paris -1210 +▁tiger -1211 +hanahia -1212 +▁africa -1213 +▁brazil -1214 +▁faataa -1215 +▁flosse -1216 +▁fritch -1217 +▁moorea -1218 +▁oxford -1219 +▁semita -1220 +▁taiete -1221 +▁tāpōnē -1222 +▁utuutu -1223 +▁србије -1224 +▁alijata -1225 +▁csebász -1226 +▁edouard -1227 +▁mātāmua -1228 +▁theresa -1229 +▁maìtihia -1230 +▁indicatif -1231 +▁faanavairaa -1232 +ad -1233 +al -1234 +bo -1235 +by -1236 +cy -1237 +ds -1238 +dé -1239 +if -1240 +ir -1241 +km -1242 +lt -1243 +mā -1244 +tt -1245 +wi -1246 +▁á -1247 +bre -1248 +cal -1249 +cen -1250 +eti -1251 +for -1252 +ges -1253 +gye -1254 +her -1255 +hle -1256 +iro -1257 +itā -1258 +las -1259 +lau -1260 +llo -1261 +log -1262 +mer -1263 +ney -1264 +nio -1265 +nyi -1266 +orū -1267 +pen -1268 +pra -1269 +ssi -1270 +tho -1271 +tum -1272 +uba -1273 +vid -1274 +zer -1275 +▁ad -1276 +▁ae -1277 +▁el -1278 +▁fo -1279 +▁kū -1280 +▁mc -1281 +▁ng -1282 +▁on -1283 +▁ow -1284 +▁ré -1285 +▁we -1286 +▁ya -1287 +▁ye -1288 +berg -1289 +ller -1290 +mata -1291 +mera -1292 +misi -1293 +nsis -1294 +oane -1295 +ordà -1296 +otea -1297 +para -1298 +rapu -1299 +rles -1300 +tane -1301 +tapu -1302 +teti -1303 +trus -1304 +tītī -1305 +urai -1306 +▁afi -1307 +▁aku -1308 +▁ata -1309 +▁bas -1310 +▁bis -1311 +▁car -1312 +▁gar -1313 +▁han -1314 +▁ice -1315 +▁ino -1316 +▁lla -1317 +▁moi -1318 +▁nen -1319 +▁nià -1320 +▁ona -1321 +▁ore -1322 +▁phi -1323 +▁ref -1324 +▁sar -1325 +▁uru -1326 +▁ver -1327 +▁you -1328 +▁ôoà -1329 +enana -1330 +erorū -1331 +meida -1332 +menia -1333 +mpane -1334 +phyll -1335 +riraa -1336 +senta -1337 +tiare -1338 +urutu -1339 +áresz -1340 +▁anua -1341 +▁arai -1342 +▁cana -1343 +▁cata -1344 
+▁faai -1345 +▁hehe -1346 +▁hill -1347 +▁huka -1348 +▁kilo -1349 +▁lone -1350 +▁maui -1351 +▁pato -1352 +▁rava -1353 +▁rock -1354 +▁roma -1355 +▁roro -1356 +▁sain -1357 +▁tana -1358 +▁tano -1359 +▁taui -1360 +▁teva -1361 +▁tita -1362 +▁âvaè -1363 +▁ātea -1364 +gascar -1365 +itāria -1366 +ivavae -1367 +manuel -1368 +▁adamu -1369 +▁aotea -1370 +▁arata -1371 +▁cream -1372 +▁faufa -1373 +▁hesse -1374 +▁hāmoa -1375 +▁māori -1376 +▁oscar -1377 +▁rapae -1378 +▁sahle -1379 +▁tahuà -1380 +▁terra -1381 +▁zingi -1382 +▁âtopa -1383 +empordà -1384 +▁manihi -1385 +▁napuka -1386 +▁piihia -1387 +▁pōtītī -1388 +▁rurutu -1389 +▁russie -1390 +▁taonga -1391 +▁temaru -1392 +▁tetahi -1393 +▁tiurai -1394 +▁tuarua -1395 +beraceae -1396 +erorūtia -1397 +ramarama -1398 +▁afirika -1399 +▁almeida -1400 +▁charles -1401 +▁maupiti -1402 +▁sotiare -1403 +▁tahuata -1404 +▁tamaiti -1405 +▁tauiraa -1406 +▁tempane -1407 +▁tenuare -1408 +▁êperera -1409 +sentation -1410 +▁aotearoa -1411 +▁institut -1412 +▁lonedona -1413 +▁maitiraa -1414 +▁manureva -1415 +▁official -1416 +▁paratāne -1417 +▁peretāne -1418 +▁porapora -1419 +▁raivavae -1420 +▁rimatara -1421 +▁taatiraa -1422 +▁taiarapu -1423 +▁tapearaa -1424 +▁apatoerau -1425 +▁paraparau -1426 +▁rubiaceae -1427 +▁madagascar -1428 +▁pierorūtia -1429 +▁présentation -1430 +▁zingiberaceae -1431 +", -1432 +.) -1433 +ah -1434 +ar -1435 +ed -1436 +ff -1437 +ks -1438 +oe -1439 +oi -1440 +pl -1441 +pā -1442 +pŭ -1443 +su -1444 +tí -1445 +ue -1446 +vá -1447 +xi -1448 +zy -1449 +». 
-1450 +òa -1451 +ós -1452 +на -1453 +▁× -1454 +▁р -1455 +amā -1456 +ati -1457 +bar -1458 +bla -1459 +bri -1460 +csi -1461 +dan -1462 +del -1463 +epi -1464 +eru -1465 +fan -1466 +gau -1467 +gor -1468 +gua -1469 +hui -1470 +iat -1471 +ine -1472 +isz -1473 +kwa -1474 +lar -1475 +len -1476 +lez -1477 +lis -1478 +mar -1479 +mau -1480 +nca -1481 +nea -1482 +nel -1483 +ner -1484 +oso -1485 +pel -1486 +pus -1487 +rac -1488 +ric -1489 +ted -1490 +tià -1491 +uar -1492 +uis -1493 +use -1494 +ves -1495 +wai -1496 +xan -1497 +yev -1498 +ìte -1499 +ēra -1500 +ŭpŭ -1501 +▁ag -1502 +▁bu -1503 +▁ch -1504 +▁dé -1505 +▁má -1506 +▁oa -1507 +▁qu -1508 +▁sc -1509 +atua -1510 +bert -1511 +burg -1512 +enko -1513 +fera -1514 +gory -1515 +hara -1516 +hiva -1517 +humb -1518 +iahi -1519 +koto -1520 +lium -1521 +logy -1522 +mana -1523 +maru -1524 +mihi -1525 +musa -1526 +nell -1527 +pala -1528 +pani -1529 +pehe -1530 +puai -1531 +rela -1532 +ster -1533 +tina -1534 +tipe -1535 +vern -1536 +ītia -1537 +▁afa -1538 +▁aka -1539 +▁amu -1540 +▁ave -1541 +▁bor -1542 +▁bre -1543 +▁cor -1544 +▁csi -1545 +▁dna -1546 +▁est -1547 +▁fro -1548 +▁hao -1549 +▁hiò -1550 +▁iii -1551 +▁imi -1552 +▁kau -1553 +▁lau -1554 +▁llo -1555 +▁man -1556 +▁maì -1557 +▁men -1558 +▁māi -1559 +▁ngā -1560 +▁non -1561 +▁nuu -1562 +▁oti -1563 +▁phd -1564 +▁pri -1565 +▁qua -1566 +▁qui -1567 +▁rua -1568 +▁sal -1569 +▁sou -1570 +▁tar -1571 +▁tro -1572 +▁uta -1573 +▁web -1574 +aceae -1575 +ctory -1576 +episo -1577 +hanti -1578 +irobi -1579 +kueru -1580 +moana -1581 +muera -1582 +naaro -1583 +neine -1584 +ngton -1585 +pûraa -1586 +rāria -1587 +tānia -1588 +ászop -1589 +▁aamu -1590 +▁afua -1591 +▁aman -1592 +▁anto -1593 +▁feli -1594 +▁fifi -1595 +▁gita -1596 +▁king -1597 +▁kāna -1598 +▁mais -1599 +▁maka -1600 +▁maro -1601 +▁meià -1602 +▁mele -1603 +▁nene -1604 +▁open -1605 +▁opua -1606 +▁popu -1607 +▁pŭpŭ -1608 +▁raia -1609 +▁reao -1610 +▁slei -1611 +▁taea -1612 +▁tani -1613 +▁teri -1614 +▁tona -1615 +▁tong -1616 +▁tuva -1617 +▁tīri 
-1618 +▁vict -1619 +▁vren -1620 +▁vītī -1621 +▁well -1622 +▁àere -1623 +carpus -1624 +eaèraa -1625 +gauche -1626 +gyekye -1627 +mation -1628 +metera -1629 +ngarau -1630 +tavake -1631 +ururaa -1632 +▁brong -1633 +▁david -1634 +▁faaea -1635 +▁faito -1636 +▁grace -1637 +▁hanna -1638 +▁ioane -1639 +▁matau -1640 +▁minsk -1641 +▁oware -1642 +▁papai -1643 +▁piahi -1644 +▁ranei -1645 +▁ravea -1646 +▁saint -1647 +▁tiare -1648 +▁tieti -1649 +▁tonga -1650 +▁touri -1651 +▁tātou -1652 +▁villa -1653 +iatpala -1654 +phyllum -1655 +tahiraa -1656 +tipetia -1657 +▁apatoa -1658 +▁arutua -1659 +▁bissiw -1660 +▁chirac -1661 +▁disney -1662 +▁farani -1663 +▁govern -1664 +▁hīmene -1665 +▁lāmihi -1666 +▁mahiti -1667 +▁makemo -1668 +▁nászop -1669 +▁setepa -1670 +▁tiaraa -1671 +▁titema -1672 +▁tuiroo -1673 +▁tupuai -1674 +▁tureia -1675 +▁varela -1676 +▁waiata -1677 +episodio -1678 +▁ashanti -1679 +▁densité -1680 +▁hikueru -1681 +▁hinaaro -1682 +▁jacques -1683 +▁nairobi -1684 +▁opuaraa -1685 +▁raatira -1686 +▁sleiman -1687 +▁taairaa -1688 +▁takaroa -1689 +▁taravai -1690 +▁whakama -1691 +▁areteria -1692 +▁fakarava -1693 +▁fanauraa -1694 +▁peretane -1695 +▁tahitien -1696 +▁faaineine -1697 +▁vitipetia -1698 +▁autaeaèraa -1699 +▁mauiatpala -1700 +▁nukutavake -1701 +▁amuitahiraa -1702 +▁faahopearaa -1703 +▁haamaramarama -1704 +cu -1705 +cé -1706 +dc -1707 +ft -1708 +hr -1709 +ji -1710 +jo -1711 +ps -1712 +px -1713 +rē -1714 +sp -1715 +wo -1716 +ys -1717 +ło -1718 +ик -1719 +ال -1720 +▁б -1721 +▁в -1722 +▁г -1723 +▁т -1724 +▁– -1725 +ahu -1726 +apa -1727 +ape -1728 +bez -1729 +bhi -1730 +bou -1731 +cel -1732 +ces -1733 +cro -1734 +cti -1735 +din -1736 +dri -1737 +ear -1738 +ena -1739 +ens -1740 +faì -1741 +fes -1742 +fia -1743 +fri -1744 +gar -1745 +ght -1746 +gli -1747 +gue -1748 +hio -1749 +ihā -1750 +jan -1751 +kar -1752 +kau -1753 +ker -1754 +kyi -1755 +nde -1756 +nie -1757 +nya -1758 +nye -1759 +nyá -1760 +osc -1761 +pae -1762 +pho -1763 +raì -1764 +rie -1765 +rio -1766 +rne -1767 +rot -1768 
+sah -1769 +sil -1770 +sme -1771 +ssa -1772 +sua -1773 +tim -1774 +trá -1775 +urt -1776 +usz -1777 +val -1778 +vio -1779 +yol -1780 +āpo -1781 +īne -1782 +ōpu -1783 +ōpū -1784 +▁at -1785 +▁ea -1786 +▁es -1787 +▁fé -1788 +▁kī -1789 +▁lí -1790 +▁my -1791 +▁ou -1792 +▁pû -1793 +▁um -1794 +▁òe -1795 +▁ùo -1796 +▁ło -1797 +aore -1798 +auia -1799 +bhit -1800 +cher -1801 +dium -1802 +enta -1803 +erra -1804 +fana -1805 +haro -1806 +hune -1807 +itea -1808 +kozy -1809 +lata -1810 +lena -1811 +lifi -1812 +lika -1813 +llet -1814 +mina -1815 +mini -1816 +mira -1817 +nald -1818 +ness -1819 +ngli -1820 +noto -1821 +olle -1822 +onal -1823 +papa -1824 +pium -1825 +port -1826 +raro -1827 +rena -1828 +ring -1829 +roto -1830 +sion -1831 +tani -1832 +taru -1833 +tome -1834 +tres -1835 +tutu -1836 +āito -1837 +ōire -1838 +▁ahi -1839 +▁bar -1840 +▁ber -1841 +▁bes -1842 +▁bré -1843 +▁csá -1844 +▁flo -1845 +▁fon -1846 +▁gam -1847 +▁gua -1848 +▁her -1849 +▁hoe -1850 +▁how -1851 +▁hōê -1852 +▁isa -1853 +▁iva -1854 +▁iòa -1855 +▁kua -1856 +▁lee -1857 +▁lui -1858 +▁mul -1859 +▁nao -1860 +▁nor -1861 +▁ofa -1862 +▁peu -1863 +▁pra -1864 +▁rau -1865 +▁shi -1866 +▁sil -1867 +▁ste -1868 +▁tha -1869 +▁toi -1870 +▁tou -1871 +▁von -1872 +▁wes -1873 +▁wil -1874 +amaru -1875 +drell -1876 +earch -1877 +fenua -1878 +heira -1879 +koata -1880 +maiao -1881 +natae -1882 +oseph -1883 +piuma -1884 +rench -1885 +rutea -1886 +terni -1887 +ticia -1888 +tress -1889 +tunga -1890 +ānira -1891 +īneti -1892 +ōpuhi -1893 +▁agot -1894 +▁aids -1895 +▁ange -1896 +▁anno -1897 +▁anti -1898 +▁auro -1899 +▁aute -1900 +▁avec -1901 +▁bian -1902 +▁blay -1903 +▁cada -1904 +▁caro -1905 +▁dire -1906 +▁elia -1907 +▁gene -1908 +▁hotu -1909 +▁huna -1910 +▁mara -1911 +▁mere -1912 +▁mont -1913 +▁namu -1914 +▁nico -1915 +▁nova -1916 +▁paki -1917 +▁pera -1918 +▁pili -1919 +▁poro -1920 +▁port -1921 +▁repo -1922 +▁rosa -1923 +▁ruga -1924 +▁sapi -1925 +▁tape -1926 +▁taru -1927 +▁tena -1928 +▁tohu -1929 +▁topa -1930 +▁tote -1931 +▁tuha -1932 
+▁turu -1933 +▁twer -1934 +▁tāma -1935 +▁veve -1936 +▁vous -1937 +▁wiki -1938 +auitai -1939 +chelor -1940 +ihānia -1941 +inetia -1942 +inītia -1943 +itoito -1944 +oturaa -1945 +perēra -1946 +ration -1947 +stique -1948 +ubakar -1949 +ulenta -1950 +uruuru -1951 +vaceae -1952 +▁ahafo -1953 +▁anuan -1954 +▁atete -1955 +▁atura -1956 +▁feliu -1957 +▁horoa -1958 +▁inter -1959 +▁iriti -1960 +▁lanca -1961 +▁lydia -1962 +▁maimi -1963 +▁maira -1964 +▁martí -1965 +▁nengo -1966 +▁patri -1967 +▁paulo -1968 +▁pihai -1969 +▁tamau -1970 +▁teura -1971 +▁thumb -1972 +▁tuata -1973 +▁tuete -1974 +▁tunis -1975 +▁vaihī -1976 +▁vietu -1977 +▁washi -1978 +▁whare -1979 +▁âtete -1980 +▁łobez -1981 +ographi -1982 +▁alexan -1983 +▁aroraa -1984 +▁autahu -1985 +▁canada -1986 +▁chapel -1987 +▁cīneti -1988 +▁dental -1989 +▁faaore -1990 +▁faaoti -1991 +▁feruri -1992 +▁french -1993 +▁gitata -1994 +▁joseph -1995 +▁julius -1996 +▁kilifi -1997 +▁lamisi -1998 +▁mahina -1999 +▁mariri -2000 +▁mauiui -2001 +▁morena -2002 +▁mētera -2003 +▁parahi -2004 +▁paturu -2005 +▁pātifi -2006 +▁quakyi -2007 +▁refere -2008 +▁tepoto -2009 +▁titeti -2010 +▁tupuna -2011 +▁tāpura -2012 +▁tītema -2013 +▁tōnoto -2014 +▁vairaa -2015 +▁vānira -2016 +▁wesley -2017 +▁actress -2018 +▁amankwa -2019 +▁araceae -2020 +▁armenia -2021 +▁faahana -2022 +▁faatura -2023 +▁hororaa -2024 +▁itenati -2025 +▁marutea -2026 +▁pariraa -2027 +▁poaceae -2028 +▁raiatea -2029 +▁rekoata -2030 +▁sarkozy -2031 +▁tamuera -2032 +▁tapuraa -2033 +▁tipiuma -2034 +▁tuatahi -2035 +ternidade -2036 +▁abubakar -2037 +▁bachelor -2038 +▁emmanuel -2039 +▁grandola -2040 +▁hanahana -2041 +▁kwaghfan -2042 +▁musaceae -2043 +▁officina -2044 +▁peritome -2045 +▁pilibhit -2046 +▁présiden -2047 +▁pukapuka -2048 +▁pāpaìraa -2049 +▁tatakoto -2050 +▁tōtaiete -2051 +▁vendrell -2052 +▁victoria -2053 +peretiteni -2054 +▁anaanatae -2055 +▁auterāria -2056 +▁csebásztá -2057 +▁directory -2058 +▁esculenta -2059 +▁faaiteraa -2060 +▁faaitoito -2061 +▁haamauraa -2062 +▁haapiihia -2063 
+▁hamaniraa -2064 +▁malvaceae -2065 +▁taviniraa -2066 +▁annonaceae -2067 +▁cīnetienei -2068 +▁faahoturaa -2069 +▁government -2070 +▁haapapûraa -2071 +▁perititeni -2072 +▁washington -2073 +▁atepaihānia -2074 +▁tāmahanahia -2075 +▁faaipoipohia -2076 +▁fraternidade -2077 +], -2078 +dr -2079 +et -2080 +ig -2081 +ià -2082 +lk -2083 +lé -2084 +mc -2085 +mn -2086 +mē -2087 +ok -2088 +pf -2089 +rá -2090 +sy -2091 +tô -2092 +ud -2093 +up -2094 +we -2095 +ww -2096 +xa -2097 +yi -2098 +yo -2099 +zi -2100 +às -2101 +ço -2102 +çà -2103 +éa -2104 +ée -2105 +ôm -2106 +ši -2107 +ад -2108 +бл -2109 +еп -2110 +ич -2111 +ни -2112 +од -2113 +ри -2114 +▁< -2115 +▁| -2116 +▁î -2117 +▁ī -2118 +▁к -2119 +▁о -2120 +▁п -2121 +▁я -2122 +abi -2123 +aif -2124 +bil -2125 +bio -2126 +bun -2127 +cep -2128 +ció -2129 +cos -2130 +cse -2131 +cur -2132 +cus -2133 +dad -2134 +dis -2135 +eno -2136 +ert -2137 +eva -2138 +fau -2139 +gio -2140 +git -2141 +hea -2142 +hos -2143 +ily -2144 +ins -2145 +ius -2146 +jet -2147 +kon -2148 +kul -2149 +kyo -2150 +lab -2151 +lav -2152 +ldo -2153 +lev -2154 +lip -2155 +lit -2156 +lop -2157 +lou -2158 +lus -2159 +mes -2160 +mos -2161 +mpi -2162 +niu -2163 +nks -2164 +nle -2165 +nyà -2166 +oia -2167 +ors -2168 +oru -2169 +osé -2170 +pai -2171 +plô -2172 +pou -2173 +ppa -2174 +psi -2175 +ral -2176 +reg -2177 +rey -2178 +ros -2179 +sei -2180 +ssà -2181 +ssè -2182 +sul -2183 +szk -2184 +tat -2185 +taè -2186 +tey -2187 +thi -2188 +tio -2189 +tit -2190 +tsk -2191 +uni -2192 +uts -2193 +vea -2194 +vià -2195 +vol -2196 +vre -2197 +wha -2198 +zsá -2199 +áze -2200 +ção -2201 +епу -2202 +ике -2203 +▁), -2204 +▁." 
-2205 +▁ak -2206 +▁ce -2207 +▁cs -2208 +▁ec -2209 +▁er -2210 +▁gu -2211 +▁gé -2212 +▁jr -2213 +▁mp -2214 +▁nū -2215 +▁ue -2216 +▁ui -2217 +▁un -2218 +▁yô -2219 +▁», -2220 +▁àu -2221 +▁èo -2222 +▁āu -2223 +▁ši -2224 +abid -2225 +addo -2226 +anno -2227 +ante -2228 +anus -2229 +aroa -2230 +atoa -2231 +bier -2232 +cana -2233 +celo -2234 +cipa -2235 +come -2236 +cord -2237 +cská -2238 +dela -2239 +dena -2240 +ehia -2241 +elle -2242 +enga -2243 +ents -2244 +erca -2245 +erto -2246 +fran -2247 +gier -2248 +heti -2249 +hiru -2250 +iaca -2251 +iahu -2252 +inai -2253 +inne -2254 +irae -2255 +issa -2256 +jevo -2257 +kara -2258 +ksan -2259 +leia -2260 +lina -2261 +ling -2262 +lino -2263 +lius -2264 +lues -2265 +ming -2266 +mons -2267 +mota -2268 +naho -2269 +nand -2270 +nces -2271 +nder -2272 +nice -2273 +nuae -2274 +oast -2275 +olum -2276 +onel -2277 +peak -2278 +peci -2279 +piho -2280 +poro -2281 +puni -2282 +rade -2283 +riba -2284 +site -2285 +ssou -2286 +taki -2287 +tapo -2288 +tary -2289 +tata -2290 +tica -2291 +timé -2292 +tito -2293 +toni -2294 +ttar -2295 +ture -2296 +tārē -2297 +uisa -2298 +urae -2299 +urse -2300 +usée -2301 +vela -2302 +vina -2303 +viri -2304 +ward -2305 +çois -2306 +ìraa -2307 +▁aba -2308 +▁agu -2309 +▁alb -2310 +▁ama -2311 +▁api -2312 +▁bon -2313 +▁bos -2314 +▁cli -2315 +▁dro -2316 +▁edu -2317 +▁ela -2318 +▁fai -2319 +▁fal -2320 +▁for -2321 +▁fru -2322 +▁gen -2323 +▁gil -2324 +▁gon -2325 +▁gou -2326 +▁gui -2327 +▁hos -2328 +▁iba -2329 +▁ivi -2330 +▁jan -2331 +▁jes -2332 +▁kei -2333 +▁lli -2334 +▁loa -2335 +▁mis -2336 +▁môm -2337 +▁nan -2338 +▁ndc -2339 +▁new -2340 +▁nom -2341 +▁ola -2342 +▁ono -2343 +▁pas -2344 +▁rai -2345 +▁rea -2346 +▁rii -2347 +▁rik -2348 +▁rio -2349 +▁rop -2350 +▁sol -2351 +▁sot -2352 +▁sra -2353 +▁whi -2354 +▁www -2355 +▁xvi -2356 +▁àhu -2357 +▁ìte -2358 +▁òia -2359 +atoro -2360 +berto -2361 +bilia -2362 +blanc -2363 +blika -2364 +buntu -2365 +burgh -2366 +canus -2367 +chris -2368 +ction -2369 +denia -2370 +dirne -2371 +erere 
-2372 +folia -2373 +hanga -2374 +heraa -2375 +hinga -2376 +lands -2377 +llada -2378 +losop -2379 +lunya -2380 +maraa -2381 +mataì -2382 +media -2383 +mángo -2384 +ngila -2385 +ograd -2386 +oroni -2387 +ouest -2388 +pania -2389 +plôme -2390 +prage -2391 +ranta -2392 +rdoso -2393 +rihia -2394 +risci -2395 +risti -2396 +sioni -2397 +ssède -2398 +suari -2399 +szter -2400 +tapua -2401 +taraa -2402 +thoni -2403 +tiano -2404 +tista -2405 +tophe -2406 +uardo -2407 +ukash -2408 +umotu -2409 +utuna -2410 +whaka -2411 +блике -2412 +▁anaè -2413 +▁antô -2414 +▁ariā -2415 +▁arue -2416 +▁bara -2417 +▁bola -2418 +▁calo -2419 +▁cape -2420 +▁cate -2421 +▁colo -2422 +▁coro -2423 +▁edin -2424 +▁eiao -2425 +▁este -2426 +▁faba -2427 +▁faus -2428 +▁feti -2429 +▁fédé -2430 +▁glau -2431 +▁hara -2432 +▁huku -2433 +▁hōho -2434 +▁jack -2435 +▁josé -2436 +▁kato -2437 +▁kiri -2438 +▁kore -2439 +▁logo -2440 +▁lucy -2441 +▁lāli -2442 +▁medi -2443 +▁mihi -2444 +▁mira -2445 +▁moho -2446 +▁momo -2447 +▁nous -2448 +▁osma -2449 +▁paea -2450 +▁pehe -2451 +▁pina -2452 +▁pola -2453 +▁povo -2454 +▁pure -2455 +▁quem -2456 +▁rené -2457 +▁rohi -2458 +▁sara -2459 +▁scho -2460 +▁tapa -2461 +▁temp -2462 +▁teti -2463 +▁tika -2464 +▁tiro -2465 +▁tomo -2466 +▁tono -2467 +▁turo -2468 +▁yeke -2469 +▁àito -2470 +▁репу -2471 +annona -2472 +citrus -2473 +daceae -2474 +hiahia -2475 +issala -2476 +iteraa -2477 +itiraa -2478 +laceae -2479 +lation -2480 +linois -2481 +llande -2482 +maitai -2483 +ndanus -2484 +perara -2485 +sement -2486 +tersen -2487 +torika -2488 +tuania -2489 +▁abdel -2490 +▁ahuru -2491 +▁akufo -2492 +▁apiti -2493 +▁caste -2494 +▁chris -2495 +▁coast -2496 +▁cunha -2497 +▁docum -2498 +▁enana -2499 +▁etahi -2500 +▁garri -2501 +▁heheu -2502 +▁henry -2503 +▁hurae -2504 +▁infor -2505 +▁jonas -2506 +▁katoa -2507 +▁laura -2508 +▁maama -2509 +▁maeva -2510 +▁mahia -2511 +▁maohi -2512 +▁mataì -2513 +▁maupi -2514 +▁messi -2515 +▁mohio -2516 +▁najet -2517 +▁nurse -2518 +▁outou -2519 +▁palau -2520 +▁patia -2521 
+▁pirae -2522 +▁popaā -2523 +▁press -2524 +▁proje -2525 +▁ramos -2526 +▁sofia -2527 +▁speak -2528 +▁speci -2529 +▁stati -2530 +▁tairi -2531 +▁tokyo -2532 +▁tupai -2533 +▁tāati -2534 +▁ville -2535 +▁vitor -2536 +▁yange -2537 +▁ètārē -2538 +ctorius -2539 +disiaca -2540 +enovela -2541 +mations -2542 +nyáresz -2543 +oscorea -2544 +otetani -2545 +rareraa -2546 +ritoria -2547 +timédia -2548 +waitara -2549 +▁ahurea -2550 +▁anokye -2551 +▁anotau -2552 +▁bianya -2553 +▁citrus -2554 +▁donald -2555 +▁faaapu -2556 +▁faahou -2557 +▁futuna -2558 +▁hatutu -2559 +▁hitiaa -2560 +▁ibadan -2561 +▁ingila -2562 +▁iteraa -2563 +▁kufour -2564 +▁laurey -2565 +▁lesley -2566 +▁lionel -2567 +▁louisa -2568 +▁manawa -2569 +▁manuae -2570 +▁martin -2571 +▁mbayev -2572 +▁meheti -2573 +▁mensah -2574 +▁metres -2575 +▁nainai -2576 +▁nicole -2577 +▁nuihau -2578 +▁numera -2579 +▁ordena -2580 +▁papara -2581 +▁parlez -2582 +▁patava -2583 +▁prisci -2584 +▁profes -2585 +▁pūerto -2586 +▁raìroa -2587 +▁rotopū -2588 +▁sangen -2589 +▁srairi -2590 +▁taatoa -2591 +▁tapiho -2592 +▁tereza -2593 +▁terihi -2594 +▁tuvaru -2595 +▁tāvana -2596 +▁united -2597 +▁univer -2598 +▁uturoa -2599 +▁vrenko -2600 +atuaiahu -2601 +losophia -2602 +tapuatea -2603 +tocarpus -2604 +▁aleksan -2605 +▁america -2606 +▁amuiraa -2607 +▁andrade -2608 +▁batista -2609 +▁beograd -2610 +▁bibilia -2611 +▁bolanle -2612 +▁cardoso -2613 +▁commons -2614 +▁diplôme -2615 +▁eduardo -2616 +▁faafana -2617 +▁faarahi -2618 +▁farerei -2619 +▁gambier -2620 +▁jesberg -2621 +▁llierca -2622 +▁mataura -2623 +▁misioni -2624 +▁muthoni -2625 +▁nyerere -2626 +▁patrick -2627 +▁paturaa -2628 +▁possède -2629 +▁pureraa -2630 +▁ravehia -2631 +▁raveraa -2632 +▁raìātea -2633 +▁riroraa -2634 +▁rorofaì -2635 +▁sissala -2636 +▁taheraa -2637 +▁tairoto -2638 +▁tangata -2639 +▁tumaraa -2640 +▁tunisia -2641 +▁tūāmotu -2642 +▁village -2643 +▁website -2644 +▁âperera -2645 +▁êperara -2646 +▁šiprage -2647 +ukashenko -2648 +▁amankwah -2649 +▁arapania -2650 +▁caroline -2651 +▁category 
-2652 +▁fabaceae -2653 +▁faustina -2654 +▁françois -2655 +▁ghanaian -2656 +▁haerenga -2657 +▁haereraa -2658 +▁heheuraa -2659 +▁hollande -2660 +▁katolika -2661 +▁katorika -2662 +▁maitihia -2663 +▁maìtiraa -2664 +▁moraceae -2665 +▁otitānia -2666 +▁pangarau -2667 +▁parauhia -2668 +▁pehepehe -2669 +▁punaauia -2670 +▁rituania -2671 +▁rutaceae -2672 +▁sarajevo -2673 +▁tapotapo -2674 +▁taputapu -2675 +▁tauatini -2676 +▁titauraa -2677 +▁toromona -2678 +▁uetersen -2679 +▁wellness -2680 +▁ètārētia -2681 +▁catalunya -2682 +▁documents -2683 +▁edinburgh -2684 +▁faahiahia -2685 +▁faaotiraa -2686 +▁institute -2687 +▁makeranta -2688 +▁parahiraa -2689 +▁parururaa -2690 +▁tectorius -2691 +▁tuatapapa -2692 +▁wikimedia -2693 +▁републике -2694 +▁kilometera -2695 +▁multimédia -2696 +▁population -2697 +▁porotetani -2698 +▁présidence -2699 +▁references -2700 +▁tapihooraa -2701 +▁telenovela -2702 +▁territoria -2703 +atuaiahutapu -2704 +▁faanahonaho -2705 +▁faaohiparaa -2706 +▁pakiwaitara -2707 +▁paradisiaca -2708 +▁peritomeraa -2709 +▁philosophia -2710 +▁faaineinehia -2711 +▁haaparareraa -2712 +▁taputapuatea -2713 +▁faahanahanahia -2714 +.[ -2715 +ac -2716 +aè -2717 +bb -2718 +bá -2719 +bé -2720 +cl -2721 +cê -2722 +df -2723 +dí -2724 +dó -2725 +fé -2726 +hy -2727 +ib -2728 +ju -2729 +kp -2730 +kā -2731 +lv -2732 +mm -2733 +mw -2734 +nō -2735 +oh -2736 +pī -2737 +rt -2738 +tì -2739 +tū -2740 +uk -2741 +un -2742 +ux -2743 +vō -2744 +wī -2745 +yd -2746 +yl -2747 +yu -2748 +zh -2749 +», -2750 +ás -2751 +ên -2752 +ît -2753 +ùo -2754 +āi -2755 +či -2756 +ед -2757 +ст -2758 +عب -2759 +▁# -2760 +▁= -2761 +▁° -2762 +▁û -2763 +▁ū -2764 +▁ʼ -2765 +▁ˈ -2766 +▁а -2767 +▁д -2768 +▁е -2769 +▁з -2770 +▁и -2771 +▁й -2772 +▁л -2773 +▁н -2774 +▁ц -2775 +▁ч -2776 +▁ш -2777 +▁ы -2778 +ale -2779 +ali -2780 +alo -2781 +ani -2782 +ank -2783 +ans -2784 +apu -2785 +arā -2786 +ase -2787 +aug -2788 +aux -2789 +ava -2790 +bes -2791 +bor -2792 +cie -2793 +com -2794 +cre -2795 +cri -2796 +day -2797 +dra -2798 +dua 
-2799 +ка -2800 +▁у -2801 +bis -2802 +bua -2803 +cto -2804 +ehi -2805 +eie -2806 +eue -2807 +fer -2808 +ffe -2809 +fim -2810 +fos -2811 +fre -2812 +gie -2813 +gos -2814 +gro -2815 +gui -2816 +har -2817 +hie -2818 +hin -2819 +hot -2820 +iar -2821 +ide -2822 +ini -2823 +isu -2824 +jor -2825 +kin -2826 +koa -2827 +kos -2828 +kru -2829 +lco -2830 +lls -2831 +lly -2832 +lol -2833 +lto -2834 +láu -2835 +mad -2836 +mah -2837 +mat -2838 +mgo -2839 +mia -2840 +mie -2841 +min -2842 +mir -2843 +mni -2844 +mor -2845 +mot -2846 +mui -2847 +nen -2848 +nho -2849 +nor -2850 +nou -2851 +nti -2852 +nva -2853 +nys -2854 +oha -2855 +ols -2856 +one -2857 +ono -2858 +onu -2859 +oti -2860 +ots -2861 +ous -2862 +paa -2863 +pal -2864 +pan -2865 +pii -2866 +pon -2867 +pos -2868 +pse -2869 +ras -2870 +reu -2871 +rid -2872 +riu -2873 +rni -2874 +rés -2875 +san -2876 +sea -2877 +sha -2878 +sit -2879 +siu -2880 +ski -2881 +sto -2882 +tan -2883 +teg -2884 +thy -2885 +tic -2886 +tie -2887 +tiu -2888 +toà -2889 +toè -2890 +ttu -2891 +tue -2892 +upa -2893 +urs -2894 +ute -2895 +vau -2896 +vel -2897 +vis -2898 +wen -2899 +af -2900 +ки -2901 +▁ó -2902 +bas -2903 +elr -2904 +iso -2905 +isy -2906 +mic -2907 +moe -2908 +ndo -2909 +noa -2910 +now -2911 +rdi -2912 +the -2913 +tty -2914 +whi -2915 +yij -2916 +zen -2917 +zes -2918 +zos -2919 +ûru -2920 +āpi -2921 +āto -2922 +čes -2923 +ītā -2924 +īwī -2925 +ōna -2926 +рад -2927 +род -2928 +▁(° -2929 +▁az -2930 +▁cé -2931 +▁dá -2932 +▁dä -2933 +▁ej -2934 +▁gi -2935 +▁gl -2936 +▁gá -2937 +▁io -2938 +▁iz -2939 +▁kā -2940 +▁mé -2941 +▁od -2942 +▁oè -2943 +▁pá -2944 +▁pē -2945 +▁pī -2946 +▁sp -2947 +▁sé -2948 +▁sí -2949 +▁th -2950 +▁ty -2951 +▁uk -2952 +▁us -2953 +▁vá -2954 +▁wh -2955 +▁ze -2956 +▁». 
-2957 +▁ту -2958 +▁ال -2959 +alpi -2960 +anth -2961 +arii -2962 +bayo -2963 +bral -2964 +ccha -2965 +cial -2966 +ción -2967 +cron -2968 +date -2969 +desh -2970 +divi -2971 +eira -2972 +elli -2973 +ence -2974 +enix -2975 +eren -2976 +eres -2977 +esca -2978 +esia -2979 +esti -2980 +fano -2981 +fski -2982 +gado -2983 +goso -2984 +gual -2985 +hapa -2986 +hata -2987 +heli -2988 +hena -2989 +hera -2990 +hina -2991 +hinu -2992 +hiro -2993 +hono -2994 +hora -2995 +iaki -2996 +iana -2997 +ibge -2998 +inda -2999 +ró -3000 +.). -3001 +dol -3002 +dom -3003 +eux -3004 +iki -3005 +kum -3006 +llà -3007 +nce -3008 +rst -3009 +▁". -3010 +▁). -3011 +amra -3012 +fata -3013 +grat -3014 +inga -3015 +jany -3016 +jour -3017 +kahu -3018 +kare -3019 +kava -3020 +keok -3021 +kete -3022 +kiro -3023 +kota -3024 +kume -3025 +kura -3026 +ladi -3027 +lano -3028 +lecu -3029 +left -3030 +lesz -3031 +lien -3032 +liki -3033 +lixa -3034 +llus -3035 +lnea -3036 +lori -3037 +lska -3038 +lter -3039 +léme -3040 +mara -3041 +mato -3042 +mbra -3043 +meka -3044 +meni -3045 +mont -3046 +mote -3047 +muna -3048 +nani -3049 +nato -3050 +nava -3051 +navi -3052 +ndis -3053 +ners -3054 +nges -3055 +ngoa -3056 +ngon -3057 +niak -3058 +nini -3059 +nira -3060 +nuve -3061 +onné -3062 +oriz -3063 +orro -3064 +osco -3065 +osus -3066 +otri -3067 +otro -3068 +oute -3069 +peri -3070 +piah -3071 +pipi -3072 +pohe -3073 +pool -3074 +puri -3075 +putu -3076 +quel -3077 +quer -3078 +quil -3079 +raka -3080 +rara -3081 +reia -3082 +ries -3083 +risi -3084 +ropo -3085 +rson -3086 +ruhi -3087 +ruve -3088 +rédé -3089 +rātā -3090 +sara -3091 +sien -3092 +siti -3093 +ssen -3094 +stor -3095 +sula -3096 +szte -3097 +tade -3098 +tahu -3099 +amâ -3100 +bel -3101 +kei -3102 +ong -3103 +ron -3104 +sso -3105 +une -3106 +àau -3107 +ère -3108 +▁zu -3109 +▁на -3110 +cast -3111 +cego -3112 +cide -3113 +cies -3114 +kowa -3115 +kále -3116 +nake -3117 +rike -3118 +stro -3119 +taro -3120 +tati -3121 +ther -3122 +thri -3123 +tifo -3124 +tika -3125 
+tine -3126 +tiri -3127 +tsch -3128 +tska -3129 +tten -3130 +ttli -3131 +uaku -3132 +udad -3133 +urne -3134 +usta -3135 +uvea -3136 +uvre -3137 +vaco -3138 +vier -3139 +vila -3140 +viny -3141 +voir -3142 +vōta -3143 +wani -3144 +yama -3145 +áres -3146 +èrau -3147 +ètoè -3148 +état -3149 +être -3150 +íbal -3151 +òhia -3152 +āraì -3153 +рист -3154 +▁aau -3155 +▁abc -3156 +▁ahe -3157 +▁air -3158 +▁ake -3159 +▁ami -3160 +▁apo -3161 +▁arb -3162 +▁atâ -3163 +▁aua -3164 +▁aux -3165 +▁ben -3166 +▁beu -3167 +▁bol -3168 +▁bru -3169 +▁cam -3170 +▁cen -3171 +▁ceo -3172 +▁cla -3173 +▁die -3174 +▁din -3175 +▁dra -3176 +▁eie -3177 +▁eli -3178 +▁esz -3179 +▁fan -3180 +▁far -3181 +▁fil -3182 +▁flu -3183 +▁flá -3184 +▁fre -3185 +▁gif -3186 +▁gre -3187 +▁hea -3188 +▁hel -3189 +▁ina -3190 +▁ire -3191 +▁jus -3192 +▁kar -3193 +▁kni -3194 +▁koa -3195 +▁kom -3196 +▁kpi -3197 +▁lin -3198 +▁loi -3199 +at -3200 +ôr -3201 +bol -3202 +der -3203 +glo -3204 +ifo -3205 +luc -3206 +oko -3207 +pià -3208 +von -3209 +íso -3210 +▁fā -3211 +▁já -3212 +▁xh -3213 +▁za -3214 +aita -3215 +bird -3216 +bosa -3217 +cifo -3218 +eraa -3219 +gill -3220 +gues -3221 +káve -3222 +lder -3223 +mbre -3224 +ndão -3225 +polu -3226 +pure -3227 +pōra -3228 +rcia -3229 +rdia -3230 +rons -3231 +rump -3232 +soma -3233 +veta -3234 +ícia -3235 +▁acu -3236 +▁bio -3237 +▁los -3238 +▁lud -3239 +▁mlu -3240 +▁moe -3241 +▁myr -3242 +▁nas -3243 +▁nya -3244 +▁não -3245 +▁oba -3246 +▁oei -3247 +▁oto -3248 +▁oui -3249 +▁pad -3250 +▁pen -3251 +▁pep -3252 +▁per -3253 +▁pfi -3254 +▁pii -3255 +▁ple -3256 +▁pop -3257 +▁rei -3258 +▁res -3259 +▁roh -3260 +▁sad -3261 +▁sau -3262 +▁sci -3263 +▁sea -3264 +▁ses -3265 +▁sme -3266 +▁son -3267 +▁sti -3268 +▁sto -3269 +▁stu -3270 +▁ten -3271 +▁tom -3272 +▁toà -3273 +▁ufi -3274 +▁val -3275 +▁vea -3276 +▁vii -3277 +▁vir -3278 +▁yem -3279 +▁yes -3280 +▁zan -3281 +▁àif -3282 +▁àno -3283 +▁àti -3284 +▁âau -3285 +▁âià -3286 +▁âpī -3287 +▁ère -3288 +▁òro -3289 +▁ùru -3290 +ahotu -3291 +alofa -3292 +amana 
-3293 +ankro -3294 +apira -3295 +arava -3296 +arāau -3297 +atata -3298 +bbins -3299 +etu -3300 +jar -3301 +rià -3302 +▁ér -3303 +blic -3304 +dyta -3305 +java -3306 +lada -3307 +lité -3308 +melo -3309 +orld -3310 +phor -3311 +rapa -3312 +▁che -3313 +▁jau -3314 +▁six -3315 +▁tho -3316 +apeto -3317 +aturi -3318 +brega -3319 +casia -3320 +ching -3321 +chyum -3322 +ciano -3323 +colum -3324 +conia -3325 +crest -3326 +curma -3327 +deval -3328 +dinha -3329 +dulus -3330 +dísti -3331 +ehara -3332 +entum -3333 +féren -3334 +gegie -3335 +geria -3336 +gifer -3337 +gique -3338 +guaya -3339 +hangi -3340 +hação -3341 +hetia -3342 +hiata -3343 +hibis -3344 +hiraa -3345 +iland -3346 +illes -3347 +imira -3348 +inapo -3349 +irani -3350 +itihi -3351 +iātea -3352 +kehau -3353 +lcomb -3354 +leurs -3355 +llets -3356 +marie -3357 +mores -3358 +moteo -3359 +muaki -3360 +naldo -3361 +nells -3362 +nellà -3363 +nesco -3364 +nford -3365 +niara -3366 +nilla -3367 +niota -3368 +nshin -3369 +ntiif -3370 +nuraa -3371 +oragi -3372 +orata -3373 +ordor -3374 +oreau -3375 +orges -3376 +orpho -3377 +oscou -3378 +petit -3379 +piria -3380 +pital -3381 +publi -3382 +pāpaì -3383 +quise -3384 +rican -3385 +riket -3386 +riona -3387 +rothe -3388 +runga -3389 +silia -3390 +steur -3391 +story -3392 +sulté -3393 +tahaa -3394 +taima -3395 +taito -3396 +talum -3397 +tangi -3398 +teate -3399 +tilis -3400 +tinia -3401 +tonia -3402 +tráti -3403 +tuhaa -3404 +tumor -3405 +tures -3406 +uador -3407 +ubaix -3408 +univa -3409 +uraro -3410 +ution -3411 +vador -3412 +veira -3413 +verne -3414 +vesen -3415 +wanga -3416 +wango -3417 +yline -3418 +zalez -3419 +zerba -3420 +zosta -3421 +çanet -3422 +ïaraa -3423 +ānani -3424 +родна -3425 +▁achi -3426 +▁aito -3427 +▁aora -3428 +▁ashe -3429 +▁asia -3430 +▁aura -3431 +▁azin -3432 +▁baku -3433 +▁basi -3434 +▁boui -3435 +▁burt -3436 +▁caba -3437 +▁camb -3438 +▁camp -3439 +▁cara -3440 +▁city -3441 +▁cláu -3442 +▁cora -3443 +▁cour -3444 +▁cuba -3445 +▁curi -3446 +▁data -3447 +▁disz -3448 
+▁domi -3449 +▁duck -3450 +▁duma -3451 +▁eaha -3452 +▁espo -3453 +▁esta -3454 +▁fine -3455 +▁flav -3456 +▁from -3457 +▁heli -3458 +▁hitu -3459 +▁hune -3460 +▁iyol -3461 +▁joan -3462 +▁kaha -3463 +▁kpaa -3464 +▁land -3465 +▁lehn -3466 +▁lins -3467 +▁lisa -3468 +▁lond -3469 +▁luiz -3470 +▁mama -3471 +▁mary -3472 +▁mati -3473 +▁meka -3474 +▁mena -3475 +▁miro -3476 +▁moli -3477 +▁mona -3478 +▁moru -3479 +▁moto -3480 +▁muni -3481 +▁name -3482 +▁nano -3483 +▁natī -3484 +▁nava -3485 +▁news -3486 +▁niau -3487 +▁niuē -3488 +▁nkru -3489 +▁noaa -3490 +▁nono -3491 +▁nuci -3492 +▁ohie -3493 +▁omua -3494 +▁oteg -3495 +▁otia -3496 +▁pala -3497 +▁papu -3498 +▁pati -3499 +▁patr -3500 +▁pene -3501 +▁pont -3502 +▁porī -3503 +▁poti -3504 +▁poto -3505 +▁pour -3506 +▁pres -3507 +▁prot -3508 +▁puig -3509 +▁reis -3510 +▁rien -3511 +▁riud -3512 +▁roll -3513 +▁ropu -3514 +▁rose -3515 +▁ruby -3516 +▁rōpū -3517 +▁sala -3518 +▁sali -3519 +▁sera -3520 +▁sert -3521 +▁seus -3522 +▁sine -3523 +▁snow -3524 +▁sola -3525 +▁suis -3526 +▁sule -3527 +▁surf -3528 +▁taro -3529 +▁teko -3530 +▁teme -3531 +▁tepa -3532 +▁tepo -3533 +▁teve -3534 +▁titi -3535 +▁toau -3536 +▁toka -3537 +▁tonu -3538 +▁tuhe -3539 +▁tuhu -3540 +▁tura -3541 +▁tutu -3542 +▁tōna -3543 +▁uira -3544 +▁vall -3545 +▁vana -3546 +▁vera -3547 +▁você -3548 +▁vāna -3549 +▁with -3550 +▁wīwī -3551 +▁âamu -3552 +▁âmui -3553 +▁îraa -3554 +africa -3555 +aifiti -3556 +amâraa -3557 +apiira -3558 +ataata -3559 +atuhia -3560 +cation -3561 +celona -3562 +center -3563 +chiman -3564 +donald -3565 +edirne -3566 +fauraa -3567 +fortia -3568 +gentea -3569 +heretō -3570 +hostal -3571 +huinga -3572 +hīmene -3573 +iriraa -3574 +ivavao -3575 +kareka -3576 +kuláre -3577 +llyday -3578 +lémena -3579 +marama -3580 +minist -3581 +misina -3582 +nglish -3583 +ngonui -3584 +numiti -3585 +nuvera -3586 +oniifo -3587 +prache -3588 +ribati -3589 +roella -3590 +ruhito -3591 +sident -3592 +silien -3593 +spesia -3594 +sticum -3595 +sulare -3596 +sypium -3597 +tepipi -3598 
+terani -3599 +ticosa -3600 +tārava -3601 +urites -3602 +urunga -3603 +vatska -3604 +waiata -3605 +ìteraa -3606 +ристич -3607 +▁actua -3608 +▁adaku -3609 +▁adela -3610 +▁alata -3611 +▁alice -3612 +▁alpha -3613 +▁amanu -3614 +▁amaru -3615 +▁angli -3616 +▁arabi -3617 +▁aroha -3618 +▁auraa -3619 +▁award -3620 +▁betty -3621 +▁bisiw -3622 +▁blues -3623 +▁boute -3624 +▁bowen -3625 +▁brest -3626 +▁cassà -3627 +▁citri -3628 +▁commi -3629 +▁daily -3630 +▁daisy -3631 +▁denis -3632 +▁eesti -3633 +▁ejisu -3634 +▁etoni -3635 +▁faaau -3636 +▁faaru -3637 +▁faati -3638 +▁faith -3639 +▁falab -3640 +▁ferra -3641 +▁ferri -3642 +▁fetia -3643 +▁fetià -3644 +▁first -3645 +▁flori -3646 +▁franc -3647 +▁frédé -3648 +▁fānau -3649 +▁gusta -3650 +▁haamo -3651 +▁hanga -3652 +▁henen -3653 +▁henri -3654 +▁hiroà -3655 +▁huaai -3656 +▁hōreo -3657 +▁idade -3658 +▁igual -3659 +▁infos -3660 +▁ingoa -3661 +▁julià -3662 +▁jurei -3663 +▁kairo -3664 +▁katiu -3665 +▁komfo -3666 +▁konge -3667 +▁kwame -3668 +▁kwase -3669 +▁leone -3670 +▁liver -3671 +▁longa -3672 +▁lídia -3673 +▁manar -3674 +▁manui -3675 +▁mello -3676 +▁merci -3677 +▁methy -3678 +▁moluc -3679 +▁monte -3680 +▁mount -3681 +▁musée -3682 +▁names -3683 +▁negro -3684 +▁nenei -3685 +▁nepal -3686 +▁nephi -3687 +▁noreg -3688 +▁nyáze -3689 +▁opani -3690 +▁panda -3691 +▁papaa -3692 +▁parti -3693 +▁perez -3694 +▁photo -3695 +▁plaît -3696 +▁popaa -3697 +▁pouri -3698 +▁prado -3699 +▁premi -3700 +▁priva -3701 +▁puoro -3702 +▁pwani -3703 +▁pāpua -3704 +▁ratio -3705 +▁raveā -3706 +▁rocha -3707 +▁rodri -3708 +▁rosto -3709 +▁rātou -3710 +▁sabia -3711 +▁sagit -3712 +▁seven -3713 +▁silva -3714 +▁solia -3715 +▁souff -3716 +▁souza -3717 +▁staat -3718 +▁taato -3719 +▁taero -3720 +▁taite -3721 +▁tamaì -3722 +▁tapea -3723 +▁taruā -3724 +▁taure -3725 +▁teioa -3726 +▁temoe -3727 +▁temps -3728 +▁terai -3729 +▁tikei -3730 +▁tiwhi -3731 +▁toroa -3732 +▁trump -3733 +▁tuaro -3734 +▁tuite -3735 +▁tychy -3736 +▁uttar -3737 +▁vavai -3738 +▁visit -3739 +▁vladi -3740 +▁whana 
-3741 +▁world -3742 +▁àhuru -3743 +▁ânani -3744 +▁ènana -3745 +ahotura -3746 +alpinia -3747 +ccharum -3748 +cepción -3749 +ciparum -3750 +dytarum -3751 +dística -3752 +fritsch -3753 +heretue -3754 +kávetrá -3755 +manihia -3756 +minalia -3757 +navichy -3758 +ndaceae -3759 +ngifera -3760 +paraiso -3761 +paraíso -3762 +phallus -3763 +psidium -3764 +queline -3765 +ristina -3766 +ruvetia -3767 +stiques -3768 +tallada -3769 +taronia -3770 +tetiano -3771 +thosoma -3772 +tifolia -3773 +titohia -3774 +tsoreau -3775 +ttlikon -3776 +āitoraa -3777 +ōperera -3778 +▁aguiar -3779 +▁ahakoa -3780 +▁ahunui -3781 +▁akanva -3782 +▁akiaki -3783 +▁albert -3784 +▁anavai -3785 +▁andreu -3786 +▁anuanu -3787 +▁aníbal -3788 +▁aparau -3789 +▁apatoà -3790 +▁appiah -3791 +▁arorau -3792 +▁asante -3793 +▁ateate -3794 +▁azerba -3795 +▁baskin -3796 +▁batata -3797 +▁boragi -3798 +▁brasil -3799 +▁brésil -3800 +▁carlos -3801 +▁castro -3802 +▁cavaco -3803 +▁cidade -3804 +▁compan -3805 +▁decide -3806 +▁dentro -3807 +▁dordor -3808 +▁edulis -3809 +▁elaine -3810 +▁eliana -3811 +▁eliane -3812 +▁equise -3813 +▁ereraa -3814 +▁esteve -3815 +▁eunice -3816 +▁euphor -3817 +▁faatià -3818 +▁faaàhā -3819 +▁faaàpu -3820 +▁faaûru -3821 +▁farara -3822 +▁fatata -3823 +▁fluvià -3824 +▁flávio -3825 +▁france -3826 +▁haerea -3827 +▁henryk -3828 +▁herbal -3829 +▁hetero -3830 +▁howell -3831 +▁hīmeni -3832 +▁imiraa -3833 +▁itehia -3834 +▁jacqui -3835 +▁johnny -3836 +▁kauehi -3837 +▁kouaku -3838 +▁louvre -3839 +▁macron -3840 +▁manuïa -3841 +▁maraga -3842 +▁marcel -3843 +▁mature -3844 +▁mcgill -3845 +▁mekiro -3846 +▁merger -3847 +▁metera -3848 +▁miquel -3849 +▁mokowa -3850 +▁molecu -3851 +▁mollet -3852 +▁morane -3853 +▁moroni -3854 +▁moscou -3855 +▁márcia -3856 +▁mānava -3857 +▁nihiru -3858 +▁niuhia -3859 +▁nohora -3860 +▁nūmera -3861 +▁parani -3862 +▁paraoa -3863 +▁parisi -3864 +▁peehia -3865 +▁petero -3866 +▁pfizer -3867 +▁philip -3868 +▁pinaki -3869 +▁please -3870 +▁polska -3871 +▁polyne -3872 +▁portal -3873 +▁porter -3874 
+▁rahira -3875 +▁raraka -3876 +▁raroia -3877 +▁ratere -3878 +▁riveta -3879 +▁roaraa -3880 +▁roszte -3881 +▁rēmuna -3882 +▁sahara -3883 +▁sandra -3884 +▁school -3885 +▁sierra -3886 +▁sombra -3887 +▁taenga -3888 +▁taiaro -3889 +▁takume -3890 +▁tamanu -3891 +▁tarahu -3892 +▁tauere -3893 +▁tauraa -3894 +▁taviri -3895 +▁taòhia -3896 +▁tearii -3897 +▁teatea -3898 +▁tekava -3899 +▁terera -3900 +▁thanks -3901 +▁tiaàau -3902 +▁tigers -3903 +▁tinito -3904 +▁tiàraa -3905 +▁tourne -3906 +▁toètoè -3907 +▁troglo -3908 +▁turiti -3909 +▁tuvalu -3910 +▁tāfano -3911 +▁tāhinu -3912 +▁tāporo -3913 +▁ubuntu -3914 +▁unesco -3915 +▁victor -3916 +▁vilada -3917 +▁vilama -3918 +▁whanga -3919 +▁whanui -3920 +▁whenua -3921 +▁wilson -3922 +▁yuniva -3923 +▁ànotau -3924 +▁àuhune -3925 +▁āmenia -3926 +atuahiva -3927 +aturiraa -3928 +cifolium -3929 +division -3930 +férences -3931 +gardenia -3932 +hibiscus -3933 +national -3934 +ografski -3935 +ographie -3936 +otropium -3937 +pandanus -3938 +parauraa -3939 +publique -3940 +pāpaìraa -3941 +tatihata -3942 +tifolium -3943 +whakaari -3944 +▁abankro -3945 +▁akamaru -3946 +▁altilis -3947 +▁amerika -3948 +▁angeles -3949 +▁antigen -3950 +▁antonio -3951 +▁antônio -3952 +▁anuvera -3953 +▁apataki -3954 +▁arairaa -3955 +▁aratika -3956 +▁atamira -3957 +▁atuaraa -3958 +▁barbosa -3959 +▁brandão -3960 +▁castell -3961 +▁casuari -3962 +▁catappa -3963 +▁comosus -3964 +▁corinne -3965 +▁cucurma -3966 +▁ecuador -3967 +▁english -3968 +▁faahapa -3969 +▁faahiti -3970 +▁faahoho -3971 +▁faatoro -3972 +▁faatumu -3973 +▁fagifer -3974 +▁fareata -3975 +▁fernand -3976 +▁fragoso -3977 +▁frogier -3978 +▁gregory -3979 +▁guajava -3980 +▁hanshin -3981 +▁haraiki -3982 +▁hercego -3983 +▁holcomb -3984 +▁hunaraa -3985 +▁hurihia -3986 +▁incanus -3987 +▁islands -3988 +▁jackson -3989 +▁kaukura -3990 +▁kawango -3991 +▁kingdom -3992 +▁kohinga -3993 +▁leticia -3994 +▁llémena -3995 +▁makaroa -3996 +▁makatea -3997 +▁malgrat -3998 +▁marokau -3999 +▁mataiva -4000 +▁maçanet -4001 +▁medical -4002 
+▁miranda -4003 +▁miriona -4004 +▁moruroa -4005 +▁māniota -4006 +▁nigeria -4007 +▁nkrumah -4008 +▁nohoraa -4009 +▁odorata -4010 +▁omuaraa -4011 +▁orohena -4012 +▁orvesen -4013 +▁painapo -4014 +▁pasteur -4015 +▁pipiria -4016 +▁poheraa -4017 +▁polanyi -4018 +▁poszter -4019 +▁pradesh -4020 +▁project -4021 +▁prolixa -4022 +▁puarātā -4023 +▁pukarua -4024 +▁pētānia -4025 +▁pōtinia -4026 +▁raitihi -4027 +▁rapaeau -4028 +▁reitoru -4029 +▁rikitea -4030 +▁ronaldo -4031 +▁roubaix -4032 +▁sanquer -4033 +▁science -4034 +▁serafim -4035 +▁sotelli -4036 +▁tahanea -4037 +▁taioraa -4038 +▁tatuhaa -4039 +▁tauihaa -4040 +▁tehetia -4041 +▁teienei -4042 +▁tikanga -4043 +▁tikehau -4044 +▁timoteo -4045 +▁trojany -4046 +▁tuanake -4047 +▁tumuaki -4048 +▁vahanga -4049 +▁verrons -4050 +▁vontade -4051 +▁whakapu -4052 +▁àhuāraì -4053 +▁êperēra -4054 +▁народна -4055 +chimantia -4056 +guayaquil -4057 +hostalnou -4058 +montblanc -4059 +niuterani -4060 +ntiifolia -4061 +raromataì -4062 +ringtonia -4063 +taimareva -4064 +toronetia -4065 +vernement -4066 +▁achimota -4067 +▁adelaide -4068 +▁american -4069 +▁anglican -4070 +▁argentea -4071 +▁asiatica -4072 +▁basileia -4073 +▁bouissou -4074 +▁brasilia -4075 +▁consulté -4076 +▁cristina -4077 +▁dominiak -4078 +▁faafanau -4079 +▁fakahina -4080 +▁frédéric -4081 +▁gonzalez -4082 +▁hallyday -4083 +▁hangarau -4084 +▁hospital -4085 +▁illinois -4086 +▁insulare -4087 +▁kenyatta -4088 +▁komisina -4089 +▁malhação -4090 +▁manahune -4091 +▁manutahi -4092 +▁marotiri -4093 +▁maupihaa -4094 +▁mcdonald -4095 +▁mekameka -4096 +▁melekeok -4097 +▁military -4098 +▁mātiharo -4099 +▁māuruuru -4100 +▁nanumiti -4101 +▁naruhito -4102 +▁natīrara -4103 +▁nucifera -4104 +▁nászopki -4105 +▁oeillets -4106 +▁oliveira -4107 +▁otegbayo -4108 +▁patireia -4109 +▁patrícia -4110 +▁peralada -4111 +▁peretita -4112 +▁populnea -4113 +▁profesôr -4114 +▁pātifita -4115 +▁pātifitā -4116 +▁raparapa -4117 +▁ravahere -4118 +▁rekareka -4119 +▁research -4120 +▁rohipehe -4121 +▁rongonui -4122 +▁salvador 
-4123 +▁sinensis -4124 +▁snowbird -4125 +▁speciosa -4126 +▁stanford -4127 +▁sulemana -4128 +▁takapoto -4129 +▁taratara -4130 +▁tarutaru -4131 +▁teaching -4132 +▁tekokota -4133 +▁temeharo -4134 +▁tenararo -4135 +▁tepapuri -4136 +▁thailand -4137 +▁tiribati -4138 +▁titauhia -4139 +▁toroātia -4140 +▁tourisme -4141 +▁vaataata -4142 +▁vahitahi -4143 +▁vanavana -4144 +▁ventures -4145 +▁vladimir -4146 +▁wellcome -4147 +▁whakaaro -4148 +▁whakanui -4149 +▁òrometua -4150 +▁туристич -4151 +artocarpus -4152 +christophe -4153 +heretōvina -4154 +ographical -4155 +oniifolius -4156 +zostachyum -4157 +▁actualité -4158 +▁aleksandr -4159 +▁alexandre -4160 +▁americana -4161 +▁animation -4162 +▁antitumor -4163 +▁apatoèrau -4164 +▁azinheira -4165 +▁brésilien -4166 +▁csebászti -4167 +▁dioscorea -4168 +▁dättlikon -4169 +▁faaoraraa -4170 +▁faataahia -4171 +▁faataaraa -4172 +▁faaìteraa -4173 +▁falabella -4174 +▁feruriraa -4175 +▁fruticosa -4176 +▁haamaitai -4177 +▁heremoana -4178 +▁huitārava -4179 +▁hāmanihia -4180 +▁igualdade -4181 +▁kaiwaiata -4182 +▁lancaster -4183 +▁lancastro -4184 +▁liverpool -4185 +▁manuhangi -4186 +▁manuïaraa -4187 +▁motutunga -4188 +▁myrtaceae -4189 +▁noruvetia -4190 +▁parataito -4191 +▁porinetia -4192 +▁porīnetia -4193 +▁president -4194 +▁priscille -4195 +▁republika -4196 +▁sapientum -4197 +▁taitensis -4198 +▁tamataraa -4199 +▁taraehara -4200 +▁tematangi -4201 +▁tenarunga -4202 +▁tetaronia -4203 +▁tiwhikete -4204 +▁torinetia -4205 +▁torroella -4206 +▁totegegie -4207 +▁vairaatea -4208 +▁anuanuraro -4209 +▁asantehene -4210 +▁citrifolia -4211 +▁concepción -4212 +▁faaterehau -4213 +▁faatupuhia -4214 +▁falciparum -4215 +▁fangataufa -4216 +▁floridulus -4217 +▁fédération -4218 +▁géographie -4219 +▁haamataraa -4220 +▁inophyllum -4221 +▁jacqueline -4222 +▁kongeriket -4223 +▁lukashenko -4224 +▁matauranga -4225 +▁mohiotanga -4226 +▁mountcrest -4227 +▁nukutepipi -4228 +▁officinale -4229 +▁rohfritsch -4230 +▁références -4231 +▁république -4232 +▁solanaceae -4233 +▁tirometera 
-4234 +▁université -4235 +▁valparaíso -4236 +▁whakamahia -4237 +▁whakamaori -4238 +▁yunivasiti -4239 +▁àifāitoraa -4240 +devalparaiso -4241 +orphophallus -4242 +▁anuanurunga -4243 +▁baranavichy -4244 +▁companheira -4245 +▁haamauruuru -4246 +▁hereheretue -4247 +▁kaiwhakaari -4248 +▁methysticum -4249 +▁officinarum -4250 +▁pandanaceae -4251 +▁papetitohia -4252 +▁sapindaceae -4253 +▁statistique -4254 +▁techimantia -4255 +▁teritetiano -4256 +▁touristique -4257 +▁whakaatuhia -4258 +▁boraginaceae -4259 +▁geographical -4260 +▁glaucifolium -4261 +▁gouvernement -4262 +▁informations -4263 +▁matatatihata -4264 +▁matureivavao -4265 +▁tauaparauraa -4266 +▁territoriale -4267 +▁tournefortia -4268 +▁aurantiifolia -4269 +▁equisetifolia -4270 +▁euphorbiaceae -4271 +▁international -4272 +▁nászopkávetrá -4273 +▁paeoniifolius -4274 +▁sagittifolium -4275 +▁troglodytarum -4276 +▁faanahonahoraa -4277 +.[] -4278 +cdf -4279 +juï -4280 +mcm -4281 +nçà -4282 +ród -4283 +vāi -4284 +wee -4285 +why -4286 +yip -4287 +ziz -4288 +zzi -4289 +čić -4290 +ани -4291 +вни -4292 +едн -4293 +ени -4294 +лад -4295 +нка -4296 +▁ -6707 +cor -6708 +lij -6709 +pao -6710 +taa -6711 +▁jk -6712 +bcor -6713 +othè -6714 +urac -6715 +yves -6716 +▁der -6717 +▁emi -6718 +▁haè -6719 +▁nii -6720 +▁teu -6721 +▁vol -6722 +aaamu -6723 +rissa -6724 +tiale -6725 +trosi -6726 +ttare -6727 +verde -6728 +▁andr -6729 +▁août -6730 +▁fiti -6731 +▁ihoa -6732 +▁kadu -6733 +▁pays -6734 +▁petr -6735 +▁regi -6736 +▁rico -6737 +▁tīaì -6738 +bcorda -6739 +▁biden -6740 +▁eurac -6741 +▁ferre -6742 +▁flaçà -6743 +▁mutaa -6744 +▁málij -6745 +▁neuro -6746 +▁opbri -6747 +▁samoa -6748 +▁taoto -6749 +▁tapaò -6750 +▁tiaki -6751 +▁volta -6752 +bliothè -6753 +metrosi -6754 +otiteat -6755 +patiale -6756 +saverde -6757 +▁andrze -6758 +▁droite -6759 +▁emilin -6760 +▁geneva -6761 +▁kiloni -6762 +▁regina -6763 +▁sergio -6764 +▁solius -6765 +▁sílvio -6766 +▁vilana -6767 +averrhoa -6768 +bcordata -6769 +briciano -6770 +capsicum -6771 +chnitzel -6772 
+collecti -6773 +commissa -6774 +cskumáre -6775 +ctionary -6776 +ductions -6777 +ellement -6778 +empúries -6779 +gasriika -6780 +gholough -6781 +glicério -6782 +gueiredo -6783 +hinensis -6784 +hocolate -6785 +hostoles -6786 +hrvatska -6787 +huatanga -6788 +huirecen -6789 +illinois -6790 +isztorul -6791 +ivotriko -6792 +licsárij -6793 +llastret -6794 +llobrega -6795 +légation -6796 +makitaki -6797 +matauhia -6798 +matology -6799 +)" -6800 +io -6801 +pt -6802 +pî -6803 +äc -6804 +end -6805 +eri -6806 +iaa -6807 +née -6808 +ynt -6809 +▁av -6810 +▁mk -6811 +dame -6812 +gram -6813 +nomi -6814 +quei -6815 +uang -6816 +ēera -6817 +▁(). -6818 +▁ito -6819 +▁may -6820 +▁pur -6821 +▁päc -6822 +▁teo -6823 +▁via -6824 +ciali -6825 +criti -6826 +elend -6827 +gizes -6828 +iaame -6829 +ruant -6830 +zania -6831 +▁avri -6832 +▁cale -6833 +▁cynt -6834 +▁oslo -6835 +▁prus -6836 +▁sept -6837 +▁viab -6838 +critic -6839 +gramme -6840 +liquei -6841 +nzania -6842 +▁arara -6843 +▁avril -6844 +▁hawai -6845 +▁huita -6846 +▁isabe -6847 +▁juang -6848 +▁kainu -6849 +▁mayer -6850 +▁tator -6851 +▁teeri -6852 +▁whiti -6853 +▁ûmara -6854 +perēera -6855 +rágizes -6856 +русский -6857 +▁bruant -6858 +▁faaapî -6859 +▁faatia -6860 +▁itoito -6861 +▁kelend -6862 +▁mataio -6863 +▁planes -6864 +▁tamata -6865 +▁tāhiti -6866 +boliquei -6867 +cialiste -6868 +mination -6869 +minister -6870 +miquelon -6871 +mnigueij -6872 +mothrace -6873 +nicskijá -6874 +nikultri -6875 +niàmataì -6876 +nulaceae -6877 +nyászkij -6878 +nyávnyio -6879 +olingare -6880 +ordyline -6881 +orithmic -6882 +orofenua -6883 +oshihide -6884 +peraceae -6885 +plumeria -6886 +polukáre -6887 +poláresz -6888 +pupirīta -6889 +putuputu -6890 +rahovice -6891 +ravaìraa -6892 +rdcastle -6893 +ringfire -6894 +santalum -6895 +scanthus -6896 +sshunter -6897 +sterving -6898 +tacritic -6899 +', -6900 +ык -6901 +ruï -6902 +uti -6903 +зык -6904 +▁cí -6905 +▁fâ -6906 +▁kô -6907 +dria -6908 +fatu -6909 +riva -6910 +tagu -6911 +úcia -6912 +▁mia -6913 +barça -6914 
+nenga -6915 +petri -6916 +tagut -6917 +▁arui -6918 +▁cama -6919 +▁care -6920 +▁cruï -6921 +▁huit -6922 +▁lana -6923 +▁nice -6924 +▁terā -6925 +▁vaha -6926 +▁язык -6927 +mihere -6928 +▁abbas -6929 +▁desti -6930 +▁ihipa -6931 +▁lúcia -6932 +▁miami -6933 +▁north -6934 +▁papal -6935 +▁vaiho -6936 +▁wilma -6937 +amihere -6938 +earchga -6939 +iteiraa -6940 +morinda -6941 +nengaro -6942 +▁antoni -6943 +▁career -6944 +▁cínira -6945 +▁mafatu -6946 +▁marcos -6947 +▁māiata -6948 +▁sprint -6949 +liminisz -6950 +orizonte -6951 +tanilles -6952 +tauatini -6953 +teronomi -6954 +thriller -6955 +tificial -6956 +tinanata -6957 +triváles -6958 +ttarella -6959 +uanatura -6960 +ulpellac -6961 +valevska -6962 +warszawa -6963 +whakaaro -6964 +zingiber -6965 +zinyenko -6966 +ūmatatea -6967 +купштина -6968 +▁aahiata -6969 +▁abiodun -6970 +▁adakudu -6971 +▁adakugu -6972 +▁adukwei -6973 +▁afareai -6974 +▁african -6975 +▁agyekum -6976 +▁airport -6977 +▁alberto -6978 +▁algiers -6979 +▁andrzej -6980 +▁anglais -6981 +▁anthony -6982 +▁antoine -6983 +▁antônia -6984 +▁asheley -6985 +▁asiedua -6986 +▁ataahua -6987 +▁avenida -6988 +▁balance -6989 +▁bapetiz -6990 +▁beijing -6991 +▁belango -6992 +▁berisha -6993 +▁bertaèy -6994 +▁bertero -6995 +▁bescanó -6996 +▁biology -6997 +▁boldrin -6998 +▁bollers -6999 +): -7000 +cn -7001 +tm -7002 +ân -7003 +low -7004 +sân -7005 +tep -7006 +óes -7007 +▁im -7008 +▁òc -7009 +cnrs -7010 +elus -7011 +itaā -7012 +nere -7013 +otti -7014 +tape -7015 +▁bih -7016 +▁rég -7017 +▁toa -7018 +festo -7019 +llero -7020 +numia -7021 +otted -7022 +raamu -7023 +urite -7024 +▁back -7025 +▁góes -7026 +▁haro -7027 +▁have -7028 +▁hōpe -7029 +▁iter -7030 +▁koti -7031 +▁lipo -7032 +▁ophi -7033 +▁rāua -7034 +▁tant -7035 +▁tihi -7036 +cotted -7037 +mautia -7038 +rsotti -7039 +scelus -7040 +▁agora -7041 +▁arena -7042 +▁lília -7043 +▁mario -7044 +▁moscà -7045 +▁mouta -7046 +▁nūnaa -7047 +▁régis -7048 +▁taere -7049 +▁temau -7050 +▁terii -7051 +▁tetep -7052 +itaāria -7053 +liaceus -7054 +llerols 
-7055 +nifolia -7056 +taurite -7057 +ututaru -7058 +ycotted -7059 +▁amanda -7060 +▁backpa -7061 +▁duarte -7062 +▁fortià -7063 +▁huinga -7064 +▁hānere -7065 +▁konohe -7066 +▁ludlow -7067 +▁lílian -7068 +▁miscan -7069 +▁poland -7070 +▁sobral -7071 +▁tantra -7072 +▁tarawa -7073 +▁tuuraa -7074 +csimnáze -7075 +ministry -7076 +tnership -7077 +vinyenko -7078 +▁bonjorn -7079 +▁bonjour -7080 +▁bonmatí -7081 +▁bordils -7082 +▁buzsnyá -7083 +▁cabanes -7084 +▁cainito -7085 +▁calella -7086 +▁calophy -7087 +▁camalle -7088 +▁camargo -7089 +▁camozzi -7090 +▁cananga -7091 +▁capmany -7092 +▁cassini -7093 +▁cellera -7094 +▁cheveux -7095 +▁chicago -7096 +▁christi -7097 +▁cimángo -7098 +▁climent -7099 +") -7100 +hoe -7101 +jta -7102 +nux -7103 +ram -7104 +rao -7105 +vil -7106 +▁ip -7107 +▁it -7108 +▁tv -7109 +▁tx -7110 +▁tô -7111 +chel -7112 +chno -7113 +rema -7114 +veià -7115 +▁eiâ -7116 +▁ene -7117 +▁lec -7118 +▁mum -7119 +▁ult -7120 +hawai -7121 +jtari -7122 +leana -7123 +miere -7124 +narao -7125 +ohsiu -7126 +▁dans -7127 +▁gona -7128 +▁mose -7129 +▁musi -7130 +▁paru -7131 +▁waia -7132 +▁yara -7133 +ramort -7134 +tirara -7135 +ubuntu -7136 +▁auter -7137 +▁civil -7138 +▁enemi -7139 +▁etoto -7140 +▁linux -7141 +▁láves -7142 +▁maior -7143 +▁pavel -7144 +▁publi -7145 +▁rudol -7146 +▁tôvon -7147 +▁àveià -7148 +jtarija -7149 +nanahia -7150 +ohsiung -7151 +èperēra -7152 +▁joelle -7153 +▁jurema -7154 +▁lectin -7155 +▁manage -7156 +▁michel -7157 +▁mumura -7158 +▁parupa -7159 +▁platja -7160 +▁publie -7161 +▁rudolf -7162 +▁tavana -7163 +▁techno -7164 +▁tuaiva -7165 +▁србију -7166 +pflocher -7167 +ukairani -7168 +vanadate -7169 +▁cláudia -7170 +▁cláudio -7171 +▁college -7172 +▁commise -7173 +▁contour -7174 +▁coronel -7175 +▁crespià -7176 +▁császte -7177 +▁cynthia -7178 +▁daniela -7179 +▁darnius -7180 +▁delgado -7181 +▁dentist -7182 +▁despuig -7183 +▁details -7184 +▁diszkor -7185 +▁disznyu -7186 +▁drollet -7187 +▁dutronc -7188 +▁dámángo -7189 +▁edralin -7190 +▁emperor -7191 +▁engraça -7192 
+▁escrava -7193 +▁escrito -7194 +▁espolla -7195 +▁esquina -7196 +▁essenti -7197 +▁etiopia -7198 +▁eudósia -7199 +eta -7200 +gel -7201 +hen -7202 +hgh -7203 +mij -7204 +ure -7205 +vić -7206 +▁ex -7207 +▁fc -7208 +▁fī -7209 +▁gy -7210 +▁xi -7211 +hiri -7212 +mily -7213 +mmij -7214 +ngel -7215 +ouma -7216 +rdis -7217 +reta -7218 +teen -7219 +then -7220 +vedo -7221 +▁eda -7222 +▁maō -7223 +▁rid -7224 +▁zsá -7225 +▁âte -7226 +ersti -7227 +pardi -7228 +▁angi -7229 +▁find -7230 +▁fītī -7231 +▁hali -7232 +▁jord -7233 +▁kibi -7234 +▁maes -7235 +▁riel -7236 +▁tito -7237 +▁tole -7238 +▁vasc -7239 +etabli -7240 +gelian -7241 +ollina -7242 +ródmie -7243 +tringa -7244 +zevedo -7245 +▁biure -7246 +▁cohen -7247 +▁corçà -7248 +▁douma -7249 +▁exter -7250 +▁hītoa -7251 +▁janei -7252 +▁lasso -7253 +▁milla -7254 +▁ordis -7255 +▁ridge -7256 +▁tossa -7257 +▁ôhiri -7258 +teensis -7259 +trommij -7260 +▁angitu -7261 +▁family -7262 +▁halifa -7263 +▁jordan -7264 +▁kibing -7265 +▁loreta -7266 +▁matani -7267 +▁moihaa -7268 +▁puurau -7269 +▁rangel -7270 +▁riells -7271 +▁temple -7272 +▁toleza -7273 +▁utahia -7274 +pardines -7275 +stigador -7276 +tīaniani -7277 +▁albanyà -7278 +▁azevedo -7279 +▁collina -7280 +▁eulàlia -7281 +▁faahere -7282 +▁faaueue -7283 +▁faaèraa -7284 +▁faimano -7285 +▁faraāni -7286 +▁farners -7287 +▁faufaai -7288 +▁febuare -7289 +▁feridos -7290 +▁ferrari -7291 +▁ferrite -7292 +▁foerthe -7293 +▁fonteta -7294 +▁francis -7295 +▁frutesc -7296 +▁fédéral -7297 +▁galenon -7298 +▁gateway -7299 +.' 
-7300 +éc -7301 +dak -7302 +epa -7303 +law -7304 +ndc -7305 +▁ah -7306 +▁ov -7307 +▁rs -7308 +▁sw -7309 +anaí -7310 +llar -7311 +scha -7312 +ório -7313 +▁ika -7314 +▁iot -7315 +▁māt -7316 +▁ngo -7317 +▁nov -7318 +▁pdf -7319 +▁tāà -7320 +▁xan -7321 +riana -7322 +rudak -7323 +écrit -7324 +▁chan -7325 +▁cole -7326 +▁paho -7327 +▁pedy -7328 +▁purū -7329 +▁swis -7330 +▁yare -7331 +anaína -7332 +hereta -7333 +kivále -7334 +lawton -7335 +maggio -7336 +pelkan -7337 +sienne -7338 +tīteni -7339 +▁frank -7340 +▁hamoa -7341 +▁iotua -7342 +▁overe -7343 +▁porte -7344 +▁swiss -7345 +▁turau -7346 +▁tāàmu -7347 +▁yaren -7348 +cananga -7349 +mutunga -7350 +océanie -7351 +▁colera -7352 +▁huntly -7353 +▁osório -7354 +▁purūmu -7355 +▁raroto -7356 +▁tūpoto -7357 +cecropia -7358 +csimonká -7359 +fanauhia -7360 +▁adriana -7361 +▁bàscara -7362 +▁chantal -7363 +▁gbentie -7364 +▁georges -7365 +▁giacomo -7366 +▁gilbert -7367 +▁gitanas -7368 +▁glasgow -7369 +▁golding -7370 +▁gominsk -7371 +▁goodybe -7372 +▁goulart -7373 +▁grandis -7374 +▁gregori -7375 +▁grányiz -7376 +▁guarnie -7377 +▁gugliel -7378 +▁guiller -7379 +▁guiomar -7380 +▁gustavo -7381 +▁guíxols -7382 +▁hakahau -7383 +▁halifax -7384 +▁hammura -7385 +▁hangaia -7386 +▁heimana -7387 +▁hilkias -7388 +▁hinarao -7389 +▁history -7390 +▁honiara -7391 +▁huriama -7392 +▁hussein -7393 +▁ihipapa -7394 +▁inseete -7395 +▁irenita -7396 +▁isabeau -7397 +▁jacquie -7398 +▁janaína -7399 +'. -7400 +it -7401 +jhi -7402 +vao -7403 +▁yi -7404 +buka -7405 +lowo -7406 +mila -7407 +ober -7408 +onet -7409 +▁hor -7410 +▁ior -7411 +▁rae -7412 +▁une -7413 +▁uri -7414 +▁vaù -7415 +bourg -7416 +chsen -7417 +mento -7418 +rates -7419 +troit -7420 +vanaa -7421 +álesz -7422 +едник -7423 +▁___? 
-7424 +▁akaa -7425 +▁anne -7426 +▁aunu -7427 +▁caso -7428 +▁efaa -7429 +▁jada -7430 +▁leys -7431 +▁maho -7432 +▁mori -7433 +▁peut -7434 +▁rafa -7435 +▁stre -7436 +rcumsp -7437 +rianum -7438 +wolowo -7439 +▁bojhi -7440 +▁faura -7441 +▁jacky -7442 +▁jamra -7443 +▁marty -7444 +▁meire -7445 +▁pimen -7446 +▁stats -7447 +▁strem -7448 +▁taura -7449 +komento -7450 +oncelos -7451 +▁angela -7452 +▁camila -7453 +▁coober -7454 +▁fauraò -7455 +▁fāpura -7456 +▁graffe -7457 +▁izdava -7458 +▁karzai -7459 +▁mahome -7460 +▁mieres -7461 +▁nuinga -7462 +▁pomare -7463 +▁rafael -7464 +▁sacalm -7465 +▁главни -7466 +vinyonet -7467 +▁aivanaa -7468 +▁aunuunu -7469 +▁awolowo -7470 +▁calonge -7471 +▁detroit -7472 +▁garrigo -7473 +▁haapoto -7474 +▁izdavač -7475 +▁janeiro -7476 +▁janvier -7477 +▁jaussen -7478 +▁jeanine -7479 +▁jinping -7480 +▁joachim -7481 +▁jussara -7482 +▁justine -7483 +▁kainuku -7484 +▁kaitito -7485 +▁karanga -7486 +▁kaupapa -7487 +▁kawongo -7488 +▁kilomin -7489 +▁klopper -7490 +▁knights -7491 +▁kuleana -7492 +▁kumanin -7493 +▁kôleeji -7494 +▁kōpūreo -7495 +▁larissa -7496 +▁lecythi -7497 +▁lexique -7498 +▁lietuva -7499 +.), -7500 +dam -7501 +fit -7502 +gol -7503 +mel -7504 +new -7505 +pys -7506 +uen -7507 +éon -7508 +▁ji -7509 +▁èà -7510 +duze -7511 +ffit -7512 +fifi -7513 +lleu -7514 +nunu -7515 +onto -7516 +équi -7517 +▁(), -7518 +▁bac -7519 +▁don -7520 +▁jor -7521 +▁muz -7522 +▁roc -7523 +▁sua -7524 +duzeć -7525 +mbusz -7526 +minum -7527 +munes -7528 +ngrua -7529 +tella -7530 +urval -7531 +▁esti -7532 +▁léon -7533 +▁mane -7534 +▁radc -7535 +▁rohe -7536 +duzeće -7537 +sminum -7538 +terera -7539 +équipe -7540 +▁afriy -7541 +▁atomi -7542 +▁dates -7543 +▁estre -7544 +▁gogol -7545 +▁homel -7546 +▁jordi -7547 +▁kopys -7548 +▁lycée -7549 +▁matua -7550 +▁muzeu -7551 +▁rouen -7552 +▁suave -7553 +▁tipen -7554 +istella -7555 +ngruang -7556 +phoenix -7557 +▁ahurei -7558 +▁cadaqu -7559 +▁durval -7560 +▁gentle -7561 +▁itiraa -7562 +▁limite -7563 +▁maneco -7564 +▁muzeum -7565 +▁māhora 
-7566 +▁navata -7567 +▁pānunu -7568 +▁rocles -7569 +▁ronald -7570 +▁sassou -7571 +▁sellal -7572 +▁suffit -7573 +▁tapone -7574 +▁ussher -7575 +▁vaiiho -7576 +jasminum -7577 +uixalleu -7578 +▁afriyie -7579 +▁cadaqué -7580 +▁jimángo -7581 +▁limited -7582 +▁llofriu -7583 +▁llogaia -7584 +▁llorenç -7585 +▁loisirs -7586 +▁londres -7587 +▁lottori -7588 +▁lourdes -7589 +▁lumiere -7590 +▁maestro -7591 +▁mandela -7592 +▁manihot -7593 +▁mapmuči -7594 +▁maraamu -7595 +▁maragai -7596 +▁marcelo -7597 +▁marinho -7598 +▁masarac -7599 +cad -7600 +fru -7601 +noi -7602 +ofe -7603 +▁ll -7604 +▁òu -7605 +calo -7606 +frug -7607 +muel -7608 +ncon -7609 +noha -7610 +tene -7611 +tāpa -7612 +zaré -7613 +▁ado -7614 +▁blo -7615 +▁llb -7616 +▁lle -7617 +▁são -7618 +▁tak -7619 +▁yaw -7620 +cados -7621 +gilev -7622 +ōporo -7623 +▁alvi -7624 +▁dala -7625 +▁deca -7626 +▁fano -7627 +▁itea -7628 +▁limi -7629 +▁smet -7630 +▁viri -7631 +samuel -7632 +▁adoni -7633 +▁blota -7634 +▁burgo -7635 +▁hanoi -7636 +▁llers -7637 +▁météo -7638 +▁nunes -7639 +▁rangi -7640 +▁sites -7641 +▁òutou -7642 +byteria -7643 +frugell -7644 +ncontre -7645 +▁alvise -7646 +▁cleyde -7647 +▁faatau -7648 +▁nazaré -7649 +▁papaya -7650 +▁sarrià -7651 +▁states -7652 +▁viride -7653 +▁whakau -7654 +byterian -7655 +ihianoha -7656 +▁hakihea -7657 +▁huitene -7658 +▁iteahia -7659 +▁limites -7660 +▁matangi -7661 +▁matehau -7662 +▁maupiha -7663 +▁maurice -7664 +▁mcgrath -7665 +▁meharry -7666 +▁mendoza -7667 +▁menezes -7668 +▁mennais -7669 +▁metturo -7670 +▁michael -7671 +▁mihiroa -7672 +▁miliona -7673 +▁minarii -7674 +▁mkpeyol -7675 +▁mogilev -7676 +▁moldova -7677 +▁monells -7678 +▁monstri -7679 +▁montcal -7680 +▁montgrí -7681 +▁morinda -7682 +▁moutame -7683 +▁musique -7684 +▁māremia -7685 +▁nationa -7686 +▁nevinha -7687 +▁nicolas -7688 +▁nirvana -7689 +▁nishani -7690 +▁nolasco -7691 +▁nucleic -7692 +▁obafemi -7693 +▁octobre -7694 +▁olivier -7695 +▁orriols -7696 +▁otumfuo -7697 +▁palikir -7698 +▁paltoga -7699 +sb -7700 +dar -7701 +ist -7702 
+lda -7703 +nds -7704 +pee -7705 +ppe -7706 +òne -7707 +appe -7708 +arts -7709 +atae -7710 +core -7711 +iter -7712 +koba -7713 +mayd -7714 +orga -7715 +sboa -7716 +sola -7717 +urit -7718 +wata -7719 +èche -7720 +▁fēì -7721 +▁let -7722 +▁mit -7723 +▁oix -7724 +▁pho -7725 +amahu -7726 +haere -7727 +rends -7728 +uriri -7729 +èches -7730 +▁alar -7731 +▁apee -7732 +▁deis -7733 +▁dite -7734 +▁hope -7735 +▁hula -7736 +▁hutu -7737 +▁kape -7738 +▁oroa -7739 +▁puis -7740 +▁roca -7741 +▁rāau -7742 +▁seba -7743 +église -7744 +▁araba -7745 +▁haumi -7746 +▁hilda -7747 +▁patoi -7748 +▁pukae -7749 +▁queen -7750 +▁scran -7751 +▁taeae -7752 +▁taofe -7753 +▁teata -7754 +▁twist -7755 +▁vanua -7756 +▁vorga -7757 +amahuta -7758 +appelle -7759 +mprends -7760 +rdèches -7761 +solanum -7762 +▁capsec -7763 +▁ditema -7764 +▁encore -7765 +▁freire -7766 +▁iakoba -7767 +▁lisboa -7768 +▁mahama -7769 +▁mitche -7770 +▁pātete -7771 +▁sourit -7772 +▁thomas -7773 +▁wawata -7774 +▁âpīraa -7775 +▁dindiok -7776 +▁haamene -7777 +▁lettres -7778 +▁panedes -7779 +▁parlavà -7780 +▁parlors -7781 +▁pasqual -7782 +▁patuhia -7783 +▁pecados -7784 +▁peduase -7785 +▁peptide -7786 +▁phoenix -7787 +▁pimenta -7788 +▁pinkett -7789 +▁polatsk -7790 +▁polessa -7791 +▁pologra -7792 +▁polymer -7793 +▁polymor -7794 +▁portbou -7795 +▁poutine -7796 +▁premier -7797 +▁private -7798 +▁prozeny -7799 +bac -7800 +ely -7801 +faè -7802 +hee -7803 +ifa -7804 +lló -7805 +».( -7806 +āfa -7807 +babi -7808 +chps -7809 +ctey -7810 +mbac -7811 +puru -7812 +▁cas -7813 +▁caz -7814 +▁cel -7815 +▁ent -7816 +▁frs -7817 +▁las -7818 +▁pel -7819 +▁vaa -7820 +▁èpe -7821 +babić -7822 +ckely -7823 +graph -7824 +oteur -7825 +tenim -7826 +çaise -7827 +▁adwo -7828 +▁cazu -7829 +▁deux -7830 +▁four -7831 +▁inga -7832 +▁kapa -7833 +▁kari -7834 +▁kate -7835 +▁kava -7836 +▁komo -7837 +▁line -7838 +▁matā -7839 +▁mini -7840 +▁moça -7841 +▁sils -7842 +▁tadi -7843 +▁varo -7844 +▁what -7845 +caceae -7846 +lusion -7847 +▁armen -7848 +▁braga -7849 +▁casse -7850 
+▁celso -7851 +▁entri -7852 +▁karin -7853 +▁matāu -7854 +▁mouse -7855 +▁nauru -7856 +▁orama -7857 +▁paula -7858 +▁prova -7859 +▁pāhee -7860 +▁tadić -7861 +▁tongu -7862 +▁váliá -7863 +clusion -7864 +itenati -7865 +perehia -7866 +▁aupuru -7867 +▁cazuza -7868 +▁fleurs -7869 +▁guerra -7870 +▁guetta -7871 +▁hendan -7872 +▁jectey -7873 +▁mauhaa -7874 +▁minido -7875 +▁moteur -7876 +▁sambac -7877 +▁tanora -7878 +▁tirana -7879 +▁toyota -7880 +berhardt -7881 +▁mickely -7882 +▁peltata -7883 +▁pukaemi -7884 +▁purirau -7885 +▁purpura -7886 +▁pûpûraa -7887 +▁queixàs -7888 +▁rapanga -7889 +▁results -7890 +▁ribeiro -7891 +▁ricardo -7892 +▁richard -7893 +▁riudare -7894 +▁riumors -7895 +▁robbins -7896 +▁rodolfo -7897 +▁rodrigo -7898 +▁romanyà -7899 +más -7900 +oki -7901 +rki -7902 +seu -7903 +sev -7904 +▁só -7905 +aito -7906 +fics -7907 +itoi -7908 +kiwa -7909 +kula -7910 +kutá -7911 +mith -7912 +oran -7913 +orsa -7914 +pehu -7915 +rose -7916 +seba -7917 +ssia -7918 +▁aiû -7919 +▁fep -7920 +▁kim -7921 +▁kus -7922 +▁tuf -7923 +ficus -7924 +kasev -7925 +linny -7926 +nques -7927 +okipa -7928 +orsay -7929 +paris -7930 +pines -7931 +rkiye -7932 +ssias -7933 +stião -7934 +tāura -7935 +valho -7936 +▁aivi -7937 +▁avae -7938 +▁bene -7939 +▁fase -7940 +▁file -7941 +▁henu -7942 +▁hoko -7943 +▁loko -7944 +▁roae -7945 +▁sato -7946 +▁tuku -7947 +▁tāpa -7948 +atāura -7949 +kutára -7950 +seball -7951 +▁canya -7952 +▁julia -7953 +▁mātou -7954 +▁putin -7955 +▁sande -7956 +▁smith -7957 +▁tomás -7958 +▁tufts -7959 +▁zoran -7960 +linnyer -7961 +▁andrés -7962 +▁benedi -7963 +▁eliseu -7964 +▁henuns -7965 +▁kaitoi -7966 +▁kusaug -7967 +▁manava -7968 +▁marino -7969 +▁moehau -7970 +▁roanga -7971 +▁terahi -7972 +▁tōtara -7973 +itemoana -7974 +latavila -7975 +▁cruiser -7976 +▁juliana -7977 +▁maramai -7978 +▁messias -7979 +▁rosario -7980 +▁rosztel -7981 +▁rōpūraa -7982 +▁sabrina -7983 +▁sachsen -7984 +▁sadurní -7985 +▁salazar -7986 +▁satauro -7987 +▁seattle -7988 +▁sekondi -7989 +▁senhora -7990 +▁serinyà -7991 
+▁settumo -7992 +▁simárés -7993 +▁siurana -7994 +▁skipper -7995 +▁souffle -7996 +▁souffre -7997 +▁spléger -7998 +▁sprache -7999 +div -8000 +jol -8001 +lic -8002 +old -8003 +uki -8004 +yaa -8005 +yar -8006 +▁ça -8007 +demu -8008 +leil -8009 +nyie -8010 +oldt -8011 +▁aki -8012 +▁aut -8013 +▁bay -8014 +▁ham -8015 +▁kii -8016 +▁ngu -8017 +▁rés -8018 +delic -8019 +hanna -8020 +mgole -8021 +nunaa -8022 +onyar -8023 +sator -8024 +tuete -8025 +zorro -8026 +▁iore -8027 +▁kite -8028 +▁maià -8029 +▁milo -8030 +▁piva -8031 +accadé -8032 +demuls -8033 +irihia -8034 +malaya -8035 +mboldt -8036 +▁akita -8037 +▁akyaa -8038 +▁havai -8039 +▁ihora -8040 +▁kiria -8041 +▁laugh -8042 +▁maòhi -8043 +▁ngues -8044 +▁recep -8045 +▁state -8046 +▁tulle -8047 +▁vaira -8048 +▁vajol -8049 +▁wales -8050 +araahia -8051 +entitki -8052 +ticians -8053 +vanilla -8054 +èrement -8055 +▁autran -8056 +▁edirne -8057 +▁nohona -8058 +▁penson -8059 +▁rairua -8060 +▁schyle -8061 +▁soleil -8062 +▁tahinu -8063 +▁taramo -8064 +▁teller -8065 +coquette -8066 +orozoite -8067 +▁batatas -8068 +▁destino -8069 +▁dzsávre -8070 +▁embassy -8071 +▁hammoud -8072 +▁kiriata -8073 +▁nguesso -8074 +▁pensons -8075 +▁romgole -8076 +▁stephen -8077 +▁stiller -8078 +▁studios -8079 +▁sucesso -8080 +▁switzer -8081 +▁sylvana -8082 +▁szopter -8083 +▁szupris -8084 +▁tahatai -8085 +▁tahiata -8086 +▁taimana -8087 +▁taiohae -8088 +▁takenga -8089 +▁tallinn -8090 +▁tamariu -8091 +▁tampico -8092 +▁taniera -8093 +▁tanumia -8094 +▁tanuraa -8095 +▁tapuhoe -8096 +▁taratia -8097 +▁taravao -8098 +▁tauhiti -8099 +cii -8100 +cob -8101 +dow -8102 +ham -8103 +eina -8104 +hake -8105 +hesz -8106 +mfim -8107 +mije -8108 +mosa -8109 +nsen -8110 +rium -8111 +sian -8112 +▁bip -8113 +▁ili -8114 +▁kou -8115 +▁luz -8116 +▁neo -8117 +▁yer -8118 +chter -8119 +fetia -8120 +outre -8121 +piper -8122 +riapu -8123 +widow -8124 +▁alba -8125 +▁eita -8126 +▁faaū -8127 +▁inve -8128 +▁iune -8129 +▁kako -8130 +▁keta -8131 +▁kopi -8132 +▁māmā -8133 +▁neke -8134 +▁pūhā -8135 
+▁seas -8136 +▁ster -8137 +▁tony -8138 +dreres -8139 +franca -8140 +mental -8141 +▁aiman -8142 +▁atlas -8143 +▁child -8144 +▁heiva -8145 +▁ilham -8146 +▁jacob -8147 +▁koura -8148 +▁neura -8149 +▁oliva -8150 +▁piper -8151 +▁szisz -8152 +▁tábre -8153 +▁winge -8154 +deutsch -8155 +ifaahou -8156 +ketanga -8157 +leianum -8158 +paniora -8159 +▁bomfim -8160 +▁efetia -8161 +▁faatae -8162 +▁neural -8163 +▁pupuri -8164 +▁rosana -8165 +▁russia -8166 +▁susque -8167 +▁terani -8168 +▁winged -8169 +itāriana -8170 +jonalnej -8171 +▁fariira -8172 +▁firiapu -8173 +▁protein -8174 +▁richter -8175 +▁taumotu -8176 +▁tawhiti -8177 +▁tcherno -8178 +▁teapehu -8179 +▁temaohi -8180 +▁terrace -8181 +▁tetūnaè -8182 +▁thogoto -8183 +▁tilburg -8184 +▁tinorua -8185 +▁titorot -8186 +▁tonohia -8187 +▁toparaa -8188 +▁toronga -8189 +▁toronto -8190 +▁toroven -8191 +▁toàhotu -8192 +▁tristan -8193 +▁tuatini -8194 +▁tuheita -8195 +▁tuhinga -8196 +▁tweregh -8197 +▁tāmuera -8198 +▁tātūhaa -8199 +kl -8200 +fin -8201 +gov -8202 +inq -8203 +kel -8204 +▁yj -8205 +▁»( -8206 +lisi -8207 +opae -8208 +poly -8209 +rats -8210 +vité -8211 +▁alg -8212 +▁bab -8213 +▁dit -8214 +▁àpu -8215 +eraha -8216 +melle -8217 +oires -8218 +rosti -8219 +ātata -8220 +▁amer -8221 +▁cinq -8222 +▁code -8223 +▁enei -8224 +▁lima -8225 +▁onei -8226 +▁rata -8227 +▁suga -8228 +▁suva -8229 +▁taio -8230 +▁taiò -8231 +▁told -8232 +▁waho -8233 +▁yuri -8234 +▁zulu -8235 +autara -8236 +imiraa -8237 +tiaroa -8238 +titano -8239 +▁aline -8240 +▁babão -8241 +▁breda -8242 +▁enfin -8243 +▁lauro -8244 +▁marco -8245 +▁marua -8246 +▁otahi -8247 +▁santé -8248 +▁taina -8249 +▁taora -8250 +▁virus -8251 +▁àiraa -8252 +carrats -8253 +erahama -8254 +▁arapia -8255 +▁avatea -8256 +▁devres -8257 +▁firipi -8258 +▁frança -8259 +▁fātata -8260 +▁merkel -8261 +▁miller -8262 +▁parlia -8263 +▁tanata -8264 +▁zucato -8265 +philippe -8266 +▁aperira -8267 +▁armelle -8268 +▁coração -8269 +▁haumani -8270 +▁mohamad -8271 +▁paetahi -8272 +▁paleiki -8273 +▁penedès -8274 +▁tallada 
-8275 +▁tinitoō -8276 +▁tēnuare -8277 +▁tīpaniē -8278 +▁uiuiraa -8279 +▁ukraine -8280 +▁upootià -8281 +▁utaanka -8282 +▁utrecht -8283 +▁vaipaee -8284 +▁vaitahu -8285 +▁vaitape -8286 +▁vanilla -8287 +▁vanuatu -8288 +▁vecchio -8289 +▁viabrea -8290 +▁vicente -8291 +▁victory -8292 +▁vietnam -8293 +▁vilallo -8294 +▁vilnius -8295 +▁vojnoge -8296 +▁vāhiraa -8297 +▁wangeci -8298 +▁warning -8299 +fwa -8300 +gij -8301 +ohu -8302 +autī -8303 +bile -8304 +llam -8305 +mone -8306 +orge -8307 +sity -8308 +tabi -8309 +thus -8310 +yage -8311 +ùoùo -8312 +▁lív -8313 +▁uou -8314 +fwacs -8315 +hauts -8316 +heura -8317 +itohu -8318 +ussie -8319 +vella -8320 +villa -8321 +▁belo -8322 +▁malu -8323 +▁nord -8324 +▁nota -8325 +▁pama -8326 +▁prez -8327 +▁quim -8328 +▁sela -8329 +▁team -8330 +▁uouo -8331 +▁vell -8332 +martin -8333 +▁afaro -8334 +▁chico -8335 +▁ficus -8336 +▁géros -8337 +▁hague -8338 +▁halle -8339 +▁hello -8340 +▁kitro -8341 +▁lille -8342 +▁lívia -8343 +▁merle -8344 +▁metia -8345 +▁mough -8346 +▁nasci -8347 +▁penei -8348 +▁riche -8349 +▁tāura -8350 +▁âvōta -8351 +alberto -8352 +liaceae -8353 +llaceae -8354 +▁aliyev -8355 +▁barack -8356 +▁fogars -8357 +▁garcia -8358 +▁george -8359 +▁killam -8360 +▁mobile -8361 +▁parari -8362 +▁parata -8363 +▁simone -8364 +▁studio -8365 +▁tayyip -8366 +▁torosa -8367 +▁voyage -8368 +▁destabi -8369 +▁dramani -8370 +▁ferriol -8371 +▁iakāson -8372 +▁sevilla -8373 +▁tamatoa -8374 +▁waitohu -8375 +▁weather -8376 +▁welcome -8377 +▁whaihua -8378 +▁whainga -8379 +▁whakati -8380 +▁wieners -8381 +▁winners -8382 +▁youtube -8383 +▁yáconis -8384 +▁àhureva -8385 +▁ápszkur -8386 +▁èperēra -8387 +▁épitopo -8388 +▁ātearaa -8389 +▁београд -8390 +accadémie -8391 +aleurites -8392 +anthurium -8393 +armentera -8394 +autonomia -8395 +barcelona -8396 +casuarina -8397 +cipalidad -8398 +colocasia -8399 +air -8400 +oks -8401 +aihu -8402 +ange -8403 +bece -8404 +guer -8405 +rent -8406 +rust -8407 +scle -8408 +toba -8409 +▁ati -8410 +▁fim -8411 +▁two -8412 +▁zse -8413 +▁âai 
-8414 +▁ùpu -8415 +berta -8416 +fagra -8417 +gimpa -8418 +manya -8419 +tness -8420 +▁beto -8421 +▁doce -8422 +▁dong -8423 +▁five -8424 +▁jair -8425 +▁mugo -8426 +▁nger -8427 +▁osei -8428 +▁ruta -8429 +▁suja -8430 +▁yola -8431 +▁ômua -8432 +▁ôraa -8433 +▁āura -8434 +angelo -8435 +laguer -8436 +utiraa -8437 +▁amaha -8438 +▁aniol -8439 +▁books -8440 +▁caras -8441 +▁colin -8442 +▁mooni -8443 +▁mággo -8444 +▁ngeru -8445 +▁notre -8446 +▁peter -8447 +▁runga -8448 +▁teahe -8449 +▁torra -8450 +▁trust -8451 +▁tāipe -8452 +▁utara -8453 +becetin -8454 +fagraea -8455 +history -8456 +rōpūhia -8457 +▁eloísa -8458 +▁hetera -8459 +▁isabel -8460 +▁nerone -8461 +▁pāpāho -8462 +▁sotchi -8463 +▁vahitu -8464 +▁vilano -8465 +boskulár -8466 +dremanya -8467 +gelaguer -8468 +maniscle -8469 +orometua -8470 +▁elatior -8471 +▁mathema -8472 +▁mikaere -8473 +▁toopiti -8474 +▁torrent -8475 +▁tuihani -8476 +▁witness -8477 +▁yolanda -8478 +bjuszjáká -8479 +coniaceae -8480 +cordyline -8481 +csikuszto -8482 +csivásztá -8483 +dioscorea -8484 +earchgate -8485 +erenciana -8486 +erstimnyá -8487 +ervenkálo -8488 +erythrina -8489 +etanetana -8490 +etlingera -8491 +gossypium -8492 +guettarda -8493 +hedychium -8494 +heliconia -8495 +inocarpus -8496 +ivotrikoj -8497 +kilopotri -8498 +ladelphia -8499 + -15982 +ä -15983 +ł -15984 +ш -15985 +ا -15986 +# -15987 +š -15988 +ʼ -15989 +й -15990 +ц -15991 +ы -15992 +я -15993 +ب -15994 +ع -15995 diff --git a/models/tokenizer/ty_tokenizer_8k.model b/models/tokenizer/ty_tokenizer_8k.model new file mode 100644 index 0000000000000000000000000000000000000000..5219e8857a42585eb5ce33e1ac1de5d5ddfd740e --- /dev/null +++ b/models/tokenizer/ty_tokenizer_8k.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1feeb933142d91be6574717c280b93d052cc7187e1e15c78f367879ab77c0791 +size 371547 diff --git a/models/tokenizer/ty_tokenizer_8k.vocab b/models/tokenizer/ty_tokenizer_8k.vocab new file mode 100644 index 
0000000000000000000000000000000000000000..b3725bba52a0cb40b21c5b2689904e116ad377ab --- /dev/null +++ b/models/tokenizer/ty_tokenizer_8k.vocab @@ -0,0 +1,8000 @@ + 0 + 0 + 0 + 0 +▁t -0 +▁te -1 +▁m -2 +▁i -3 +ra -4 +▁n -5 +▁ma -6 +re -7 +ti -8 +▁f -9 +▁p -10 +▁h -11 +ta -12 +ia -13 +▁ta -14 +▁’ -15 +▁mau -16 +▁e -17 +ua -18 +▁no -19 +▁o -20 +▁a -21 +na -22 +hi -23 +ire -24 +▁fa -25 +▁nō -26 +raa -27 +ot -28 +oire -29 +▁iti -30 +te -31 +or -32 +ne -33 +▁s -34 +en -35 +▁ha -36 +ri -37 +ni -38 +otu -39 +▁pa -40 +▁mā -41 +▁ò -42 +ro -43 +▁ra -44 +▁mata -45 +ha -46 +▁hō -47 +nia -48 +va -49 +▁ua -50 +enua -51 +rū -52 +▁fenua -53 +▁tata -54 +motu -55 +rūnia -56 +▁tatarūnia -57 +▁tu -58 +ma -59 +pa -60 +▁r -61 +hiti -62 +▁taa -63 +he -64 +oria -65 +iraa -66 +▁d -67 +▁soria -68 +▁faa -69 +hia -70 +▁b -71 +to -72 +▁k -73 +▁matahiti -74 +la -75 +tia -76 +▁po -77 +rā -78 +pi -79 +rāni -80 +▁farāni -81 +▁( -82 +▁na -83 +rau -84 +▁haa -85 +▁to -86 +tere -87 +▁c -88 +ura -89 +▁mai -90 +▁parau -91 +ka -92 +▁pō -93 +le -94 +rī -95 +▁re -96 +▁ti -97 +tu -98 +netia -99 +▁g -100 +ere -101 +▁taamotu -102 +▁ho -103 +li -104 +▁oia -105 +▁pōrī -106 +▁pōrīnetia -107 +▁haapi -108 +▁fare -109 +ur -110 +▁me -111 +āna -112 +ho -113 +oto -114 +ara -115 +▁pohe -116 +▁fāna -117 +er -118 +ng -119 +vi -120 +▁motu -121 +▁pohera -122 +▁fānaura -123 +po -124 +āmotu -125 +▁tene -126 +▁haapiiraa -127 +▁tuāmotu -128 +▁tenetere -129 +pu -130 +▁roto -131 +ve -132 +▁de -133 +▁pu -134 +au -135 +os -136 +▁mo -137 +▁ni -138 +▁tua -139 +si -140 +▁rahi -141 +ui -142 +tihia -143 +▁ia -144 +▁va -145 +▁ei -146 +ea -147 +ei -148 +tor -149 +haa -150 +ìtihia -151 +hana -152 +lo -153 +▁taata -154 +▁māìtihia -155 +an -156 +▁òire -157 +▁u -158 +▁hoê -159 +oraa -160 +▁w -161 +▁ri -162 +es -163 +us -164 +▁òna -165 +▁tā -166 +▁hau -167 +▁pae -168 +▁tuhaa -169 +ie -170 +toru -171 +iti -172 +▁ro -173 +▁tuatoru -174 +on -175 +are -176 +tua -177 +fi -178 +), -179 +hipa -180 +▁j -181 +me -182 +tira -183 +urg -184 +rii -185 +ru 
-186 +▁- -187 +▁l -188 +oro -189 +▁â -190 +▁burg -191 +▁pere -192 +no -193 +▁burgos -194 +ca -195 +▁vi -196 +▁ghana -197 +mi -198 +▁hi -199 +▁hu -200 +da -201 +ga -202 +▁nei -203 +▁rā -204 +pe -205 +▁rave -206 +ata -207 +▁por -208 +▁. -209 +▁' -210 +▁riro -211 +▁ohipa -212 +is -213 +ite -214 +▁fē -215 +▁pā -216 +▁reo -217 +▁puna -218 +nd -219 +eae -220 +ira -221 +ceae -222 +hine -223 +▁fēti -224 +el -225 +▁pū -226 +▁ca -227 +▁atu -228 +fa -229 +▁la -230 +▁tama -231 +pooraa -232 +▁faatere -233 +nga -234 +▁ato -235 +▁ora -236 +mo -237 +nu -238 +uri -239 +uru -240 +areva -241 +ba -242 +▁huiraa -243 +▁huiraatira -244 +ote -245 +▁ka -246 +teni -247 +se -248 +▁è -249 +▁sa -250 +itita -251 +▁poritita -252 +mu -253 +▁ai -254 +titeni -255 +▁v -256 +les -257 +▁tei -258 +hu -259 +ora -260 +tou -261 +▁ara -262 +▁raro -263 +ku -264 +▁: -265 +▁tià -266 +oa -267 +fic -268 +tai -269 +▁tahiti -270 +▁mari -271 +▁reira -272 +▁haere -273 +▁" -274 +mua -275 +▁roa -276 +▁tau -277 +ki -278 +ria -279 +rahi -280 +▁peretiteni -281 +tea -282 +▁fe -283 +▁of -284 +rama -285 +▁taote -286 +wa -287 +ya -288 +òhi -289 +▁ki -290 +▁mi -291 +▁san -292 +▁māòhi -293 +ce -294 +de -295 +naa -296 +▁af -297 +▁tae -298 +▁rapa -299 +qu -300 +▁mea -301 +▁âpooraa -302 +ol -303 +▁pupu -304 +▁maareva -305 +▁au -306 +▁pe -307 +▁pi -308 +araa -309 +▁tahi -310 +▁marite -311 +sa -312 +ore -313 +uhia -314 +▁muri -315 +▁reva -316 +▁iho -317 +ficie -318 +▁atoa -319 +▁pārahi -320 +ll -321 +tā -322 +uka -323 +▁vahine -324 +). 
-325 +di -326 +▁matamua -327 +eu -328 +▁rē -329 +▁afri -330 +▁nati -331 +do -332 +sz -333 +▁ko -334 +▁nga -335 +ch -336 +co -337 +▁nu -338 +▁hui -339 +▁farii -340 +▁haapii -341 +▁maitai -342 +ko -343 +um -344 +sia -345 +ter -346 +▁mou -347 +▁raa -348 +▁buka -349 +▁rēni -350 +ci -351 +▁ne -352 +▁so -353 +▁wha -354 +miraa -355 +▁papa -356 +▁tamarii -357 +ny -358 +ran -359 +▁ite -360 +▁teie -361 +faa -362 +per -363 +auraa -364 +▁mana -365 +▁haama -366 +ke -367 +st -368 +ana -369 +▁an -370 +▁in -371 +▁le -372 +den -373 +men -374 +▁ba -375 +euro -376 +▁maimiraa -377 +▁rapaauraa -378 +il -379 +▁‘ -380 +era -381 +▁am -382 +▁horo -383 +▁sant -384 +europa -385 +▁afrika -386 +in -387 +▁li -388 +▁râ -389 +atira -390 +▁fana -391 +▁y -392 +nei -393 +roa -394 +▁co -395 +▁he -396 +▁su -397 +▁mouà -398 +▁faana -399 +▁huira -400 +▁ku -401 +▁nā -402 +mani -403 +hō -404 +ss -405 +▁à -406 +▁ʻ -407 +pua -408 +▁ao -409 +tion -410 +▁noa -411 +▁tai -412 +▁vai -413 +siden -414 +▁metua -415 +▁ratou -416 +▁oraraa -417 +hōê -418 +sti -419 +▁lo -420 +nata -421 +tahi -422 +tita -423 +vini -424 +▁fau -425 +▁ken -426 +hōêraa -427 +▁tāhōêraa -428 +du -429 +go -430 +ts -431 +ça -432 +net -433 +āta -434 +▁wa -435 +▁apa -436 +▁mar -437 +▁fran -438 +▁tāne -439 +bi -440 +th -441 +lia -442 +lla -443 +lle -444 +que -445 +▁di -446 +▁km -447 +▁èn -448 +tepa -449 +▁amui -450 +▁atua -451 +▁huru -452 +▁noho -453 +▁poli -454 +▁whaka -455 +▁ènāta -456 +tī -457 +▁al -458 +▁da -459 +▁se -460 +▁melo -461 +▁piti -462 +▁site -463 +▁taua -464 +▁mesia -465 +▁moana -466 +▁rahiraa -467 +am -468 +gi -469 +né -470 +ito -471 +pea -472 +toa -473 +▁ac -474 +▁ve -475 +▁ana -476 +▁oro -477 +▁the -478 +▁para -479 +▁mahana -480 +perficie -481 +▁faanaho -482 +▁politita -483 +ly -484 +ou -485 +ari -486 +sie -487 +▁() -488 +vihi -489 +▁feia -490 +▁here -491 +▁pape -492 +▁apooraa -493 +▁aravihi -494 +▁peresiden -495 +▁superficie -496 +gh -497 +lu -498 +rd -499 +▁) -500 +che -501 +hau -502 +ipo -503 +ris -504 +rua -505 +tre -506 
+mona -507 +oromona -508 +▁marama -509 +▁peresideni -510 +ge -511 +▁• -512 +ord -513 +tif -514 +▁(, -515 +▁be -516 +iete -517 +tiraa -518 +▁vahi -519 +▁vila -520 +▁ènata -521 +▁faufaa -522 +ck -523 +gu -524 +ye -525 +▁z -526 +▁ô -527 +▁do -528 +▁ga -529 +▁ru -530 +pura -531 +uraa -532 +▁ani -533 +▁ter -534 +nette -535 +▁faaho -536 +▁officie -537 +▁fanauhia -538 +ai -539 +ns -540 +nt -541 +▁; -542 +ngi -543 +ola -544 +roo -545 +áre -546 +▁ap -547 +▁aè -548 +rita -549 +▁hoa -550 +metua -551 +▁tere -552 +▁tumu -553 +▁faaite -554 +▁moromona -555 +▁officiel -556 +▁faanahoraa -557 +pō -558 +ré -559 +ïa -560 +▁« -561 +▁ê -562 +▁ā -563 +ber -564 +car -565 +ete -566 +ohi -567 +oni -568 +ton -569 +▁jo -570 +tara -571 +▁tao -572 +▁vig -573 +▁poly -574 +ororaa -575 +▁apato -576 +▁faahi -577 +▁tatou -578 +▁oraora -579 +▁tuamotu -580 +▁vignette -581 +ph -582 +cia -583 +gra -584 +rus -585 +ász -586 +▁fi -587 +▁ja -588 +▁lu -589 +▁tō -590 +çais -591 +▁kuf -592 +▁tor -593 +▁manu -594 +▁tupu -595 +▁faatereraa -596 +.. 
-597 +mb -598 +pû -599 +sc -600 +za -601 +▁ù -602 +ihi -603 +man -604 +tal -605 +▁go -606 +▁mu -607 +▁tē -608 +▁ïa -609 +ahia -610 +pere -611 +poto -612 +tera -613 +▁ava -614 +▁eka -615 +▁kwa -616 +▁nui -617 +▁tia -618 +einaa -619 +lesia -620 +▁aita -621 +▁faah -622 +▁hiva -623 +▁piha -624 +▁tara -625 +▁tavini -626 +▁ekalesia -627 +▁français -628 +▁mataeinaa -629 +__ -630 +ao -631 +so -632 +hua -633 +ose -634 +pha -635 +ver -636 +▁ab -637 +▁et -638 +fare -639 +hene -640 +mala -641 +ment -642 +▁and -643 +▁des -644 +▁nia -645 +▁rus -646 +amotu -647 +nésie -648 +rīihi -649 +▁faao -650 +▁faata -651 +▁paari -652 +▁rotopu -653 +▁parīihi -654 +▁fānauhia -655 +▁heremani -656 +▁orometua -657 +be -658 +mp -659 +ama -660 +cra -661 +esu -662 +nes -663 +ori -664 +phe -665 +pia -666 +qui -667 +uor -668 +▁ar -669 +▁du -670 +rana -671 +turu -672 +▁hua -673 +▁pua -674 +▁upo -675 +puare -676 +▁iesu -677 +▁otea -678 +▁pāti -679 +▁utua -680 +taiete -681 +▁nunaa -682 +▁kufuor -683 +▁tapura -684 +▁tetepa -685 +▁fepuare -686 +▁oteania -687 +▁utuafare -688 +▁polynésie -689 +fo -690 +hn -691 +ká -692 +rs -693 +dia -694 +paì -695 +ren -696 +reo -697 +res -698 +sen -699 +▁bi -700 +▁os -701 +▁rê -702 +itei -703 +▁apî -704 +▁ari -705 +▁bra -706 +▁com -707 +▁den -708 +▁eva -709 +▁hiv -710 +▁les -711 +▁par -712 +▁pro -713 +▁arii -714 +▁atoà -715 +▁mahi -716 +▁mili -717 +▁niho -718 +▁oire -719 +▁repu -720 +▁upoo -721 +naceae -722 +▁accra -723 +▁kenya -724 +▁maria -725 +▁tahaa -726 +▁faaroo -727 +▁tahito -728 +▁teitei -729 +▁animala -730 +▁haereere -731 +▁tamahine -732 +▁maramarama -733 +je -734 +ld -735 +ry -736 +té -737 +vo -738 +ger -739 +nge -740 +nui -741 +tri -742 +usa -743 +▁ci -744 +▁en -745 +▁ju -746 +▁si -747 +orea -748 +tura -749 +ātia -750 +ndola -751 +▁aore -752 +▁nuku -753 +▁raua -754 +▁tane -755 +▁tera -756 +▁tooa -757 +henehe -758 +▁kwagh -759 +▁tahua -760 +▁nehenehe -761 +▁française -762 +▁faahororaa -763 +ja -764 +pǔ -765 +ul -766 +ão -767 +▁с -768 +bia -769 +can -770 +chi -771 
+ita -772 +los -773 +ndi -774 +nua -775 +rit -776 +unu -777 +▁as -778 +▁ge -779 +▁lá -780 +▁mē -781 +▁tī -782 +ihia -783 +nana -784 +piti -785 +tāne -786 +vema -787 +▁cha -788 +▁fer -789 +▁gra -790 +▁maa -791 +▁mua -792 +▁raì -793 +▁tea -794 +nelia -795 +▁faaa -796 +▁fara -797 +▁fatu -798 +▁hiro -799 +▁john -800 +▁maha -801 +▁mala -802 +▁papû -803 +▁tema -804 +▁ture -805 +itihia -806 +perera -807 +▁faatu -808 +▁haapa -809 +▁varua -810 +▁pōrana -811 +▁tāvini -812 +▁evanelia -813 +ls -814 +pū -815 +▁* -816 +aro -817 +bli -818 +ina -819 +iva -820 +ona -821 +tes -822 +tro -823 +utu -824 +ven -825 +▁hā -826 +▁rū -827 +ston -828 +tifā -829 +▁ali -830 +▁ere -831 +▁hoi -832 +▁hou -833 +▁ihi -834 +▁pau -835 +atere -836 +ngata -837 +rophe -838 +▁iose -839 +▁puka -840 +▁puta -841 +▁tapu -842 +▁toro -843 +ipoipo -844 +pearaa -845 +pirita -846 +▁pāpaì -847 +▁tiunu -848 +▁haamau -849 +▁novema -850 +aterehau -851 +▁haamata -852 +▁iosepha -853 +▁milioni -854 +▁tauturu -855 +▁pātitifā -856 +▁sotaiete -857 +▁faaipoipo -858 +▁repupirita -859 +bu -860 +cs -861 +ct -862 +ky -863 +nk -864 +tr -865 +tō -866 +ze -867 +▁? 
-868 +ell -869 +iri -870 +mfi -871 +mon -872 +phi -873 +ste -874 +tin -875 +tta -876 +vai -877 +ǔpǔ -878 +▁em -879 +▁gr -880 +▁ny -881 +▁or -882 +▁tm -883 +ctor -884 +dade -885 +erau -886 +here -887 +puka -888 +pōrū -889 +rava -890 +sier -891 +tete -892 +▁adu -893 +▁are -894 +▁boa -895 +▁chi -896 +▁con -897 +▁cse -898 +▁mal -899 +▁pou -900 +▁pre -901 +▁pré -902 +▁sta -903 +▁tel -904 +▁utu -905 +faaho -906 +ndica -907 +stitu -908 +▁anaa -909 +▁auta -910 +▁mate -911 +▁moni -912 +▁pǔpǔ -913 +▁raau -914 +▁rima -915 +▁taho -916 +▁tini -917 +▁tino -918 +▁offic -919 +▁osier -920 +▁rūtia -921 +▁taime -922 +▁ùpōrū -923 +ropheta -924 +▁gaston -925 +▁indica -926 +▁faatupu -927 +▁huahine -928 +▁malaria -929 +▁tupuraa -930 +▁peropheta -931 +nc -932 +op -933 +ty -934 +tá -935 +иј -936 +▁, -937 +amu -938 +dre -939 +ian -940 +ley -941 +lin -942 +mpa -943 +opo -944 +rei -945 +▁bo -946 +▁cu -947 +▁hī -948 +▁ii -949 +▁is -950 +▁ke -951 +▁lā -952 +▁vo -953 +▁wi -954 +ford -955 +iata -956 +itai -957 +manu -958 +masi -959 +mene -960 +mite -961 +ogra -962 +olia -963 +poku -964 +ques -965 +reva -966 +tema -967 +vana -968 +▁ale -969 +▁aro -970 +▁aru -971 +▁grâ -972 +▁hen -973 +▁jac -974 +▁kai -975 +▁mei -976 +▁mer -977 +▁one -978 +▁sel -979 +niora -980 +parau -981 +yamfi -982 +▁bela -983 +▁faaà -984 +▁hiti -985 +▁mani -986 +▁toru -987 +▁ware -988 +faahou -989 +firita -990 +riiraa -991 +▁hopea -992 +▁opoku -993 +▁òhipa -994 +▁hamani -995 +▁kumasi -996 +▁institu -997 +▁papeete -998 +▁tahoera -999 +▁terepia -1000 +▁faaohipa -1001 +▁grândola -1002 +". -1003 +.: -1004 +dy -1005 +fe -1006 +hā -1007 +má -1008 +sh -1009 +sá -1010 +рб -1011 +▁+ -1012 +▁[ -1013 +▁x -1014 +▁» -1015 +▁é -1016 +... 
-1017 +___ -1018 +est -1019 +gas -1020 +gen -1021 +han -1022 +kye -1023 +moa -1024 +nda -1025 +num -1026 +ort -1027 +osa -1028 +phy -1029 +rea -1030 +rum -1031 +sis -1032 +son -1033 +sta -1034 +▁il -1035 +▁je -1036 +▁ox -1037 +▁ph -1038 +dona -1039 +enei -1040 +land -1041 +line -1042 +pora -1043 +rika -1044 +riti -1045 +tava -1046 +toro -1047 +рбиј -1048 +▁___ -1049 +▁ada -1050 +▁ahu -1051 +▁bro -1052 +▁dis -1053 +▁esc -1054 +▁hei -1055 +▁hia -1056 +▁jea -1057 +▁mon -1058 +▁niu -1059 +▁pla -1060 +▁sha -1061 +▁ven -1062 +ivava -1063 +▁cseb -1064 +▁hoho -1065 +▁juli -1066 +▁mada -1067 +▁make -1068 +▁musa -1069 +▁māti -1070 +▁nana -1071 +▁peri -1072 +▁popa -1073 +▁taia -1074 +▁taka -1075 +gyamfi -1076 +ngatau -1077 +▁boadu -1078 +▁maoro -1079 +▁rusia -1080 +▁santa -1081 +▁selva -1082 +▁србиј -1083 +biaceae -1084 +āfirita -1085 +▁faaora -1086 +▁tinitō -1087 +▁tomite -1088 +▁upooti -1089 +▁belarus -1090 +▁paniora -1091 +▁raapoto -1092 +▁tuahine -1093 +▁fangatau -1094 +▁fariiraa -1095 +., -1096 +hī -1097 +ix -1098 +lá -1099 +nē -1100 +oà -1101 +▁/ -1102 +ano -1103 +api -1104 +atu -1105 +bal -1106 +cha -1107 +chy -1108 +cum -1109 +des -1110 +dio -1111 +dor -1112 +emp -1113 +ial -1114 +iao -1115 +kij -1116 +lei -1117 +lor -1118 +mei -1119 +nas -1120 +ngo -1121 +nha -1122 +nsk -1123 +our -1124 +qua -1125 +shi -1126 +siw -1127 +tau -1128 +tte -1129 +uma -1130 +zil -1131 +āni -1132 +▁ed -1133 +▁eu -1134 +▁ly -1135 +▁st -1136 +▁sz -1137 +▁tw -1138 +▁tū -1139 +▁vī -1140 +bera -1141 +doua -1142 +ella -1143 +esse -1144 +huru -1145 +ingi -1146 +jata -1147 +lles -1148 +mita -1149 +nati -1150 +orle -1151 +pera -1152 +pōnē -1153 +ream -1154 +resa -1155 +rica -1156 +sité -1157 +tero -1158 +tini -1159 +topa -1160 +tori -1161 +èraa -1162 +ātea -1163 +▁aha -1164 +▁ame -1165 +▁ano -1166 +▁bla -1167 +▁can -1168 +▁del -1169 +▁fra -1170 +▁mba -1171 +▁oli -1172 +▁que -1173 +▁sur -1174 +▁tui -1175 +▁uni -1176 +▁vau -1177 +▁vie -1178 +▁âva -1179 +losse -1180 +nuare -1181 +reraa -1182 +ritch 
-1183 +tanga -1184 +teria -1185 +tāmua -1186 +ōhipa -1187 +▁cast -1188 +▁faka -1189 +▁goka -1190 +▁hana -1191 +▁jean -1192 +▁link -1193 +▁mono -1194 +▁mora -1195 +▁patu -1196 +▁pora -1197 +▁sang -1198 +▁taha -1199 +▁tahu -1200 +▁tapo -1201 +▁tuni -1202 +douard -1203 +taceae -1204 +vairaa -1205 +▁atepa -1206 +▁atopa -1207 +▁hitia -1208 +▁korle -1209 +▁paris -1210 +▁tiger -1211 +hanahia -1212 +▁africa -1213 +▁brazil -1214 +▁faataa -1215 +▁flosse -1216 +▁fritch -1217 +▁moorea -1218 +▁oxford -1219 +▁semita -1220 +▁taiete -1221 +▁tāpōnē -1222 +▁utuutu -1223 +▁србије -1224 +▁alijata -1225 +▁csebász -1226 +▁edouard -1227 +▁mātāmua -1228 +▁theresa -1229 +▁maìtihia -1230 +▁indicatif -1231 +▁faanavairaa -1232 +ad -1233 +al -1234 +bo -1235 +by -1236 +cy -1237 +ds -1238 +dé -1239 +if -1240 +ir -1241 +km -1242 +lt -1243 +mā -1244 +tt -1245 +wi -1246 +▁á -1247 +bre -1248 +cal -1249 +cen -1250 +eti -1251 +for -1252 +ges -1253 +gye -1254 +her -1255 +hle -1256 +iro -1257 +itā -1258 +las -1259 +lau -1260 +llo -1261 +log -1262 +mer -1263 +ney -1264 +nio -1265 +nyi -1266 +orū -1267 +pen -1268 +pra -1269 +ssi -1270 +tho -1271 +tum -1272 +uba -1273 +vid -1274 +zer -1275 +▁ad -1276 +▁ae -1277 +▁el -1278 +▁fo -1279 +▁kū -1280 +▁mc -1281 +▁ng -1282 +▁on -1283 +▁ow -1284 +▁ré -1285 +▁we -1286 +▁ya -1287 +▁ye -1288 +berg -1289 +ller -1290 +mata -1291 +mera -1292 +misi -1293 +nsis -1294 +oane -1295 +ordà -1296 +otea -1297 +para -1298 +rapu -1299 +rles -1300 +tane -1301 +tapu -1302 +teti -1303 +trus -1304 +tītī -1305 +urai -1306 +▁afi -1307 +▁aku -1308 +▁ata -1309 +▁bas -1310 +▁bis -1311 +▁car -1312 +▁gar -1313 +▁han -1314 +▁ice -1315 +▁ino -1316 +▁lla -1317 +▁moi -1318 +▁nen -1319 +▁nià -1320 +▁ona -1321 +▁ore -1322 +▁phi -1323 +▁ref -1324 +▁sar -1325 +▁uru -1326 +▁ver -1327 +▁you -1328 +▁ôoà -1329 +enana -1330 +erorū -1331 +meida -1332 +menia -1333 +mpane -1334 +phyll -1335 +riraa -1336 +senta -1337 +tiare -1338 +urutu -1339 +áresz -1340 +▁anua -1341 +▁arai -1342 +▁cana -1343 +▁cata -1344 
+▁faai -1345 +▁hehe -1346 +▁hill -1347 +▁huka -1348 +▁kilo -1349 +▁lone -1350 +▁maui -1351 +▁pato -1352 +▁rava -1353 +▁rock -1354 +▁roma -1355 +▁roro -1356 +▁sain -1357 +▁tana -1358 +▁tano -1359 +▁taui -1360 +▁teva -1361 +▁tita -1362 +▁âvaè -1363 +▁ātea -1364 +gascar -1365 +itāria -1366 +ivavae -1367 +manuel -1368 +▁adamu -1369 +▁aotea -1370 +▁arata -1371 +▁cream -1372 +▁faufa -1373 +▁hesse -1374 +▁hāmoa -1375 +▁māori -1376 +▁oscar -1377 +▁rapae -1378 +▁sahle -1379 +▁tahuà -1380 +▁terra -1381 +▁zingi -1382 +▁âtopa -1383 +empordà -1384 +▁manihi -1385 +▁napuka -1386 +▁piihia -1387 +▁pōtītī -1388 +▁rurutu -1389 +▁russie -1390 +▁taonga -1391 +▁temaru -1392 +▁tetahi -1393 +▁tiurai -1394 +▁tuarua -1395 +beraceae -1396 +erorūtia -1397 +ramarama -1398 +▁afirika -1399 +▁almeida -1400 +▁charles -1401 +▁maupiti -1402 +▁sotiare -1403 +▁tahuata -1404 +▁tamaiti -1405 +▁tauiraa -1406 +▁tempane -1407 +▁tenuare -1408 +▁êperera -1409 +sentation -1410 +▁aotearoa -1411 +▁institut -1412 +▁lonedona -1413 +▁maitiraa -1414 +▁manureva -1415 +▁official -1416 +▁paratāne -1417 +▁peretāne -1418 +▁porapora -1419 +▁raivavae -1420 +▁rimatara -1421 +▁taatiraa -1422 +▁taiarapu -1423 +▁tapearaa -1424 +▁apatoerau -1425 +▁paraparau -1426 +▁rubiaceae -1427 +▁madagascar -1428 +▁pierorūtia -1429 +▁présentation -1430 +▁zingiberaceae -1431 +", -1432 +.) -1433 +ah -1434 +ar -1435 +ed -1436 +ff -1437 +ks -1438 +oe -1439 +oi -1440 +pl -1441 +pā -1442 +pŭ -1443 +su -1444 +tí -1445 +ue -1446 +vá -1447 +xi -1448 +zy -1449 +». 
-1450 +òa -1451 +ós -1452 +на -1453 +▁× -1454 +▁р -1455 +amā -1456 +ati -1457 +bar -1458 +bla -1459 +bri -1460 +csi -1461 +dan -1462 +del -1463 +epi -1464 +eru -1465 +fan -1466 +gau -1467 +gor -1468 +gua -1469 +hui -1470 +iat -1471 +ine -1472 +isz -1473 +kwa -1474 +lar -1475 +len -1476 +lez -1477 +lis -1478 +mar -1479 +mau -1480 +nca -1481 +nea -1482 +nel -1483 +ner -1484 +oso -1485 +pel -1486 +pus -1487 +rac -1488 +ric -1489 +ted -1490 +tià -1491 +uar -1492 +uis -1493 +use -1494 +ves -1495 +wai -1496 +xan -1497 +yev -1498 +ìte -1499 +ēra -1500 +ŭpŭ -1501 +▁ag -1502 +▁bu -1503 +▁ch -1504 +▁dé -1505 +▁má -1506 +▁oa -1507 +▁qu -1508 +▁sc -1509 +atua -1510 +bert -1511 +burg -1512 +enko -1513 +fera -1514 +gory -1515 +hara -1516 +hiva -1517 +humb -1518 +iahi -1519 +koto -1520 +lium -1521 +logy -1522 +mana -1523 +maru -1524 +mihi -1525 +musa -1526 +nell -1527 +pala -1528 +pani -1529 +pehe -1530 +puai -1531 +rela -1532 +ster -1533 +tina -1534 +tipe -1535 +vern -1536 +ītia -1537 +▁afa -1538 +▁aka -1539 +▁amu -1540 +▁ave -1541 +▁bor -1542 +▁bre -1543 +▁cor -1544 +▁csi -1545 +▁dna -1546 +▁est -1547 +▁fro -1548 +▁hao -1549 +▁hiò -1550 +▁iii -1551 +▁imi -1552 +▁kau -1553 +▁lau -1554 +▁llo -1555 +▁man -1556 +▁maì -1557 +▁men -1558 +▁māi -1559 +▁ngā -1560 +▁non -1561 +▁nuu -1562 +▁oti -1563 +▁phd -1564 +▁pri -1565 +▁qua -1566 +▁qui -1567 +▁rua -1568 +▁sal -1569 +▁sou -1570 +▁tar -1571 +▁tro -1572 +▁uta -1573 +▁web -1574 +aceae -1575 +ctory -1576 +episo -1577 +hanti -1578 +irobi -1579 +kueru -1580 +moana -1581 +muera -1582 +naaro -1583 +neine -1584 +ngton -1585 +pûraa -1586 +rāria -1587 +tānia -1588 +ászop -1589 +▁aamu -1590 +▁afua -1591 +▁aman -1592 +▁anto -1593 +▁feli -1594 +▁fifi -1595 +▁gita -1596 +▁king -1597 +▁kāna -1598 +▁mais -1599 +▁maka -1600 +▁maro -1601 +▁meià -1602 +▁mele -1603 +▁nene -1604 +▁open -1605 +▁opua -1606 +▁popu -1607 +▁pŭpŭ -1608 +▁raia -1609 +▁reao -1610 +▁slei -1611 +▁taea -1612 +▁tani -1613 +▁teri -1614 +▁tona -1615 +▁tong -1616 +▁tuva -1617 +▁tīri 
-1618 +▁vict -1619 +▁vren -1620 +▁vītī -1621 +▁well -1622 +▁àere -1623 +carpus -1624 +eaèraa -1625 +gauche -1626 +gyekye -1627 +mation -1628 +metera -1629 +ngarau -1630 +tavake -1631 +ururaa -1632 +▁brong -1633 +▁david -1634 +▁faaea -1635 +▁faito -1636 +▁grace -1637 +▁hanna -1638 +▁ioane -1639 +▁matau -1640 +▁minsk -1641 +▁oware -1642 +▁papai -1643 +▁piahi -1644 +▁ranei -1645 +▁ravea -1646 +▁saint -1647 +▁tiare -1648 +▁tieti -1649 +▁tonga -1650 +▁touri -1651 +▁tātou -1652 +▁villa -1653 +iatpala -1654 +phyllum -1655 +tahiraa -1656 +tipetia -1657 +▁apatoa -1658 +▁arutua -1659 +▁bissiw -1660 +▁chirac -1661 +▁disney -1662 +▁farani -1663 +▁govern -1664 +▁hīmene -1665 +▁lāmihi -1666 +▁mahiti -1667 +▁makemo -1668 +▁nászop -1669 +▁setepa -1670 +▁tiaraa -1671 +▁titema -1672 +▁tuiroo -1673 +▁tupuai -1674 +▁tureia -1675 +▁varela -1676 +▁waiata -1677 +episodio -1678 +▁ashanti -1679 +▁densité -1680 +▁hikueru -1681 +▁hinaaro -1682 +▁jacques -1683 +▁nairobi -1684 +▁opuaraa -1685 +▁raatira -1686 +▁sleiman -1687 +▁taairaa -1688 +▁takaroa -1689 +▁taravai -1690 +▁whakama -1691 +▁areteria -1692 +▁fakarava -1693 +▁fanauraa -1694 +▁peretane -1695 +▁tahitien -1696 +▁faaineine -1697 +▁vitipetia -1698 +▁autaeaèraa -1699 +▁mauiatpala -1700 +▁nukutavake -1701 +▁amuitahiraa -1702 +▁faahopearaa -1703 +▁haamaramarama -1704 +cu -1705 +cé -1706 +dc -1707 +ft -1708 +hr -1709 +ji -1710 +jo -1711 +ps -1712 +px -1713 +rē -1714 +sp -1715 +wo -1716 +ys -1717 +ło -1718 +ик -1719 +ال -1720 +▁б -1721 +▁в -1722 +▁г -1723 +▁т -1724 +▁– -1725 +ahu -1726 +apa -1727 +ape -1728 +bez -1729 +bhi -1730 +bou -1731 +cel -1732 +ces -1733 +cro -1734 +cti -1735 +din -1736 +dri -1737 +ear -1738 +ena -1739 +ens -1740 +faì -1741 +fes -1742 +fia -1743 +fri -1744 +gar -1745 +ght -1746 +gli -1747 +gue -1748 +hio -1749 +ihā -1750 +jan -1751 +kar -1752 +kau -1753 +ker -1754 +kyi -1755 +nde -1756 +nie -1757 +nya -1758 +nye -1759 +nyá -1760 +osc -1761 +pae -1762 +pho -1763 +raì -1764 +rie -1765 +rio -1766 +rne -1767 +rot -1768 
+sah -1769 +sil -1770 +sme -1771 +ssa -1772 +sua -1773 +tim -1774 +trá -1775 +urt -1776 +usz -1777 +val -1778 +vio -1779 +yol -1780 +āpo -1781 +īne -1782 +ōpu -1783 +ōpū -1784 +▁at -1785 +▁ea -1786 +▁es -1787 +▁fé -1788 +▁kī -1789 +▁lí -1790 +▁my -1791 +▁ou -1792 +▁pû -1793 +▁um -1794 +▁òe -1795 +▁ùo -1796 +▁ło -1797 +aore -1798 +auia -1799 +bhit -1800 +cher -1801 +dium -1802 +enta -1803 +erra -1804 +fana -1805 +haro -1806 +hune -1807 +itea -1808 +kozy -1809 +lata -1810 +lena -1811 +lifi -1812 +lika -1813 +llet -1814 +mina -1815 +mini -1816 +mira -1817 +nald -1818 +ness -1819 +ngli -1820 +noto -1821 +olle -1822 +onal -1823 +papa -1824 +pium -1825 +port -1826 +raro -1827 +rena -1828 +ring -1829 +roto -1830 +sion -1831 +tani -1832 +taru -1833 +tome -1834 +tres -1835 +tutu -1836 +āito -1837 +ōire -1838 +▁ahi -1839 +▁bar -1840 +▁ber -1841 +▁bes -1842 +▁bré -1843 +▁csá -1844 +▁flo -1845 +▁fon -1846 +▁gam -1847 +▁gua -1848 +▁her -1849 +▁hoe -1850 +▁how -1851 +▁hōê -1852 +▁isa -1853 +▁iva -1854 +▁iòa -1855 +▁kua -1856 +▁lee -1857 +▁lui -1858 +▁mul -1859 +▁nao -1860 +▁nor -1861 +▁ofa -1862 +▁peu -1863 +▁pra -1864 +▁rau -1865 +▁shi -1866 +▁sil -1867 +▁ste -1868 +▁tha -1869 +▁toi -1870 +▁tou -1871 +▁von -1872 +▁wes -1873 +▁wil -1874 +amaru -1875 +drell -1876 +earch -1877 +fenua -1878 +heira -1879 +koata -1880 +maiao -1881 +natae -1882 +oseph -1883 +piuma -1884 +rench -1885 +rutea -1886 +terni -1887 +ticia -1888 +tress -1889 +tunga -1890 +ānira -1891 +īneti -1892 +ōpuhi -1893 +▁agot -1894 +▁aids -1895 +▁ange -1896 +▁anno -1897 +▁anti -1898 +▁auro -1899 +▁aute -1900 +▁avec -1901 +▁bian -1902 +▁blay -1903 +▁cada -1904 +▁caro -1905 +▁dire -1906 +▁elia -1907 +▁gene -1908 +▁hotu -1909 +▁huna -1910 +▁mara -1911 +▁mere -1912 +▁mont -1913 +▁namu -1914 +▁nico -1915 +▁nova -1916 +▁paki -1917 +▁pera -1918 +▁pili -1919 +▁poro -1920 +▁port -1921 +▁repo -1922 +▁rosa -1923 +▁ruga -1924 +▁sapi -1925 +▁tape -1926 +▁taru -1927 +▁tena -1928 +▁tohu -1929 +▁topa -1930 +▁tote -1931 +▁tuha -1932 
+▁turu -1933 +▁twer -1934 +▁tāma -1935 +▁veve -1936 +▁vous -1937 +▁wiki -1938 +auitai -1939 +chelor -1940 +ihānia -1941 +inetia -1942 +inītia -1943 +itoito -1944 +oturaa -1945 +perēra -1946 +ration -1947 +stique -1948 +ubakar -1949 +ulenta -1950 +uruuru -1951 +vaceae -1952 +▁ahafo -1953 +▁anuan -1954 +▁atete -1955 +▁atura -1956 +▁feliu -1957 +▁horoa -1958 +▁inter -1959 +▁iriti -1960 +▁lanca -1961 +▁lydia -1962 +▁maimi -1963 +▁maira -1964 +▁martí -1965 +▁nengo -1966 +▁patri -1967 +▁paulo -1968 +▁pihai -1969 +▁tamau -1970 +▁teura -1971 +▁thumb -1972 +▁tuata -1973 +▁tuete -1974 +▁tunis -1975 +▁vaihī -1976 +▁vietu -1977 +▁washi -1978 +▁whare -1979 +▁âtete -1980 +▁łobez -1981 +ographi -1982 +▁alexan -1983 +▁aroraa -1984 +▁autahu -1985 +▁canada -1986 +▁chapel -1987 +▁cīneti -1988 +▁dental -1989 +▁faaore -1990 +▁faaoti -1991 +▁feruri -1992 +▁french -1993 +▁gitata -1994 +▁joseph -1995 +▁julius -1996 +▁kilifi -1997 +▁lamisi -1998 +▁mahina -1999 +▁mariri -2000 +▁mauiui -2001 +▁morena -2002 +▁mētera -2003 +▁parahi -2004 +▁paturu -2005 +▁pātifi -2006 +▁quakyi -2007 +▁refere -2008 +▁tepoto -2009 +▁titeti -2010 +▁tupuna -2011 +▁tāpura -2012 +▁tītema -2013 +▁tōnoto -2014 +▁vairaa -2015 +▁vānira -2016 +▁wesley -2017 +▁actress -2018 +▁amankwa -2019 +▁araceae -2020 +▁armenia -2021 +▁faahana -2022 +▁faatura -2023 +▁hororaa -2024 +▁itenati -2025 +▁marutea -2026 +▁pariraa -2027 +▁poaceae -2028 +▁raiatea -2029 +▁rekoata -2030 +▁sarkozy -2031 +▁tamuera -2032 +▁tapuraa -2033 +▁tipiuma -2034 +▁tuatahi -2035 +ternidade -2036 +▁abubakar -2037 +▁bachelor -2038 +▁emmanuel -2039 +▁grandola -2040 +▁hanahana -2041 +▁kwaghfan -2042 +▁musaceae -2043 +▁officina -2044 +▁peritome -2045 +▁pilibhit -2046 +▁présiden -2047 +▁pukapuka -2048 +▁pāpaìraa -2049 +▁tatakoto -2050 +▁tōtaiete -2051 +▁vendrell -2052 +▁victoria -2053 +peretiteni -2054 +▁anaanatae -2055 +▁auterāria -2056 +▁csebásztá -2057 +▁directory -2058 +▁esculenta -2059 +▁faaiteraa -2060 +▁faaitoito -2061 +▁haamauraa -2062 +▁haapiihia -2063 
+▁hamaniraa -2064 +▁malvaceae -2065 +▁taviniraa -2066 +▁annonaceae -2067 +▁cīnetienei -2068 +▁faahoturaa -2069 +▁government -2070 +▁haapapûraa -2071 +▁perititeni -2072 +▁washington -2073 +▁atepaihānia -2074 +▁tāmahanahia -2075 +▁faaipoipohia -2076 +▁fraternidade -2077 +], -2078 +dr -2079 +et -2080 +ig -2081 +ià -2082 +lk -2083 +lé -2084 +mc -2085 +mn -2086 +mē -2087 +ok -2088 +pf -2089 +rá -2090 +sy -2091 +tô -2092 +ud -2093 +up -2094 +we -2095 +ww -2096 +xa -2097 +yi -2098 +yo -2099 +zi -2100 +às -2101 +ço -2102 +çà -2103 +éa -2104 +ée -2105 +ôm -2106 +ši -2107 +ад -2108 +бл -2109 +еп -2110 +ич -2111 +ни -2112 +од -2113 +ри -2114 +▁< -2115 +▁| -2116 +▁î -2117 +▁ī -2118 +▁к -2119 +▁о -2120 +▁п -2121 +▁я -2122 +abi -2123 +aif -2124 +bil -2125 +bio -2126 +bun -2127 +cep -2128 +ció -2129 +cos -2130 +cse -2131 +cur -2132 +cus -2133 +dad -2134 +dis -2135 +eno -2136 +ert -2137 +eva -2138 +fau -2139 +gio -2140 +git -2141 +hea -2142 +hos -2143 +ily -2144 +ins -2145 +ius -2146 +jet -2147 +kon -2148 +kul -2149 +kyo -2150 +lab -2151 +lav -2152 +ldo -2153 +lev -2154 +lip -2155 +lit -2156 +lop -2157 +lou -2158 +lus -2159 +mes -2160 +mos -2161 +mpi -2162 +niu -2163 +nks -2164 +nle -2165 +nyà -2166 +oia -2167 +ors -2168 +oru -2169 +osé -2170 +pai -2171 +plô -2172 +pou -2173 +ppa -2174 +psi -2175 +ral -2176 +reg -2177 +rey -2178 +ros -2179 +sei -2180 +ssà -2181 +ssè -2182 +sul -2183 +szk -2184 +tat -2185 +taè -2186 +tey -2187 +thi -2188 +tio -2189 +tit -2190 +tsk -2191 +uni -2192 +uts -2193 +vea -2194 +vià -2195 +vol -2196 +vre -2197 +wha -2198 +zsá -2199 +áze -2200 +ção -2201 +епу -2202 +ике -2203 +▁), -2204 +▁." 
-2205 +▁ak -2206 +▁ce -2207 +▁cs -2208 +▁ec -2209 +▁er -2210 +▁gu -2211 +▁gé -2212 +▁jr -2213 +▁mp -2214 +▁nū -2215 +▁ue -2216 +▁ui -2217 +▁un -2218 +▁yô -2219 +▁», -2220 +▁àu -2221 +▁èo -2222 +▁āu -2223 +▁ši -2224 +abid -2225 +addo -2226 +anno -2227 +ante -2228 +anus -2229 +aroa -2230 +atoa -2231 +bier -2232 +cana -2233 +celo -2234 +cipa -2235 +come -2236 +cord -2237 +cská -2238 +dela -2239 +dena -2240 +ehia -2241 +elle -2242 +enga -2243 +ents -2244 +erca -2245 +erto -2246 +fran -2247 +gier -2248 +heti -2249 +hiru -2250 +iaca -2251 +iahu -2252 +inai -2253 +inne -2254 +irae -2255 +issa -2256 +jevo -2257 +kara -2258 +ksan -2259 +leia -2260 +lina -2261 +ling -2262 +lino -2263 +lius -2264 +lues -2265 +ming -2266 +mons -2267 +mota -2268 +naho -2269 +nand -2270 +nces -2271 +nder -2272 +nice -2273 +nuae -2274 +oast -2275 +olum -2276 +onel -2277 +peak -2278 +peci -2279 +piho -2280 +poro -2281 +puni -2282 +rade -2283 +riba -2284 +site -2285 +ssou -2286 +taki -2287 +tapo -2288 +tary -2289 +tata -2290 +tica -2291 +timé -2292 +tito -2293 +toni -2294 +ttar -2295 +ture -2296 +tārē -2297 +uisa -2298 +urae -2299 +urse -2300 +usée -2301 +vela -2302 +vina -2303 +viri -2304 +ward -2305 +çois -2306 +ìraa -2307 +▁aba -2308 +▁agu -2309 +▁alb -2310 +▁ama -2311 +▁api -2312 +▁bon -2313 +▁bos -2314 +▁cli -2315 +▁dro -2316 +▁edu -2317 +▁ela -2318 +▁fai -2319 +▁fal -2320 +▁for -2321 +▁fru -2322 +▁gen -2323 +▁gil -2324 +▁gon -2325 +▁gou -2326 +▁gui -2327 +▁hos -2328 +▁iba -2329 +▁ivi -2330 +▁jan -2331 +▁jes -2332 +▁kei -2333 +▁lli -2334 +▁loa -2335 +▁mis -2336 +▁môm -2337 +▁nan -2338 +▁ndc -2339 +▁new -2340 +▁nom -2341 +▁ola -2342 +▁ono -2343 +▁pas -2344 +▁rai -2345 +▁rea -2346 +▁rii -2347 +▁rik -2348 +▁rio -2349 +▁rop -2350 +▁sol -2351 +▁sot -2352 +▁sra -2353 +▁whi -2354 +▁www -2355 +▁xvi -2356 +▁àhu -2357 +▁ìte -2358 +▁òia -2359 +atoro -2360 +berto -2361 +bilia -2362 +blanc -2363 +blika -2364 +buntu -2365 +burgh -2366 +canus -2367 +chris -2368 +ction -2369 +denia -2370 +dirne -2371 +erere 
-2372 +folia -2373 +hanga -2374 +heraa -2375 +hinga -2376 +lands -2377 +llada -2378 +losop -2379 +lunya -2380 +maraa -2381 +mataì -2382 +media -2383 +mángo -2384 +ngila -2385 +ograd -2386 +oroni -2387 +ouest -2388 +pania -2389 +plôme -2390 +prage -2391 +ranta -2392 +rdoso -2393 +rihia -2394 +risci -2395 +risti -2396 +sioni -2397 +ssède -2398 +suari -2399 +szter -2400 +tapua -2401 +taraa -2402 +thoni -2403 +tiano -2404 +tista -2405 +tophe -2406 +uardo -2407 +ukash -2408 +umotu -2409 +utuna -2410 +whaka -2411 +блике -2412 +▁anaè -2413 +▁antô -2414 +▁ariā -2415 +▁arue -2416 +▁bara -2417 +▁bola -2418 +▁calo -2419 +▁cape -2420 +▁cate -2421 +▁colo -2422 +▁coro -2423 +▁edin -2424 +▁eiao -2425 +▁este -2426 +▁faba -2427 +▁faus -2428 +▁feti -2429 +▁fédé -2430 +▁glau -2431 +▁hara -2432 +▁huku -2433 +▁hōho -2434 +▁jack -2435 +▁josé -2436 +▁kato -2437 +▁kiri -2438 +▁kore -2439 +▁logo -2440 +▁lucy -2441 +▁lāli -2442 +▁medi -2443 +▁mihi -2444 +▁mira -2445 +▁moho -2446 +▁momo -2447 +▁nous -2448 +▁osma -2449 +▁paea -2450 +▁pehe -2451 +▁pina -2452 +▁pola -2453 +▁povo -2454 +▁pure -2455 +▁quem -2456 +▁rené -2457 +▁rohi -2458 +▁sara -2459 +▁scho -2460 +▁tapa -2461 +▁temp -2462 +▁teti -2463 +▁tika -2464 +▁tiro -2465 +▁tomo -2466 +▁tono -2467 +▁turo -2468 +▁yeke -2469 +▁àito -2470 +▁репу -2471 +annona -2472 +citrus -2473 +daceae -2474 +hiahia -2475 +issala -2476 +iteraa -2477 +itiraa -2478 +laceae -2479 +lation -2480 +linois -2481 +llande -2482 +maitai -2483 +ndanus -2484 +perara -2485 +sement -2486 +tersen -2487 +torika -2488 +tuania -2489 +▁abdel -2490 +▁ahuru -2491 +▁akufo -2492 +▁apiti -2493 +▁caste -2494 +▁chris -2495 +▁coast -2496 +▁cunha -2497 +▁docum -2498 +▁enana -2499 +▁etahi -2500 +▁garri -2501 +▁heheu -2502 +▁henry -2503 +▁hurae -2504 +▁infor -2505 +▁jonas -2506 +▁katoa -2507 +▁laura -2508 +▁maama -2509 +▁maeva -2510 +▁mahia -2511 +▁maohi -2512 +▁mataì -2513 +▁maupi -2514 +▁messi -2515 +▁mohio -2516 +▁najet -2517 +▁nurse -2518 +▁outou -2519 +▁palau -2520 +▁patia -2521 
+▁pirae -2522 +▁popaā -2523 +▁press -2524 +▁proje -2525 +▁ramos -2526 +▁sofia -2527 +▁speak -2528 +▁speci -2529 +▁stati -2530 +▁tairi -2531 +▁tokyo -2532 +▁tupai -2533 +▁tāati -2534 +▁ville -2535 +▁vitor -2536 +▁yange -2537 +▁ètārē -2538 +ctorius -2539 +disiaca -2540 +enovela -2541 +mations -2542 +nyáresz -2543 +oscorea -2544 +otetani -2545 +rareraa -2546 +ritoria -2547 +timédia -2548 +waitara -2549 +▁ahurea -2550 +▁anokye -2551 +▁anotau -2552 +▁bianya -2553 +▁citrus -2554 +▁donald -2555 +▁faaapu -2556 +▁faahou -2557 +▁futuna -2558 +▁hatutu -2559 +▁hitiaa -2560 +▁ibadan -2561 +▁ingila -2562 +▁iteraa -2563 +▁kufour -2564 +▁laurey -2565 +▁lesley -2566 +▁lionel -2567 +▁louisa -2568 +▁manawa -2569 +▁manuae -2570 +▁martin -2571 +▁mbayev -2572 +▁meheti -2573 +▁mensah -2574 +▁metres -2575 +▁nainai -2576 +▁nicole -2577 +▁nuihau -2578 +▁numera -2579 +▁ordena -2580 +▁papara -2581 +▁parlez -2582 +▁patava -2583 +▁prisci -2584 +▁profes -2585 +▁pūerto -2586 +▁raìroa -2587 +▁rotopū -2588 +▁sangen -2589 +▁srairi -2590 +▁taatoa -2591 +▁tapiho -2592 +▁tereza -2593 +▁terihi -2594 +▁tuvaru -2595 +▁tāvana -2596 +▁united -2597 +▁univer -2598 +▁uturoa -2599 +▁vrenko -2600 +atuaiahu -2601 +losophia -2602 +tapuatea -2603 +tocarpus -2604 +▁aleksan -2605 +▁america -2606 +▁amuiraa -2607 +▁andrade -2608 +▁batista -2609 +▁beograd -2610 +▁bibilia -2611 +▁bolanle -2612 +▁cardoso -2613 +▁commons -2614 +▁diplôme -2615 +▁eduardo -2616 +▁faafana -2617 +▁faarahi -2618 +▁farerei -2619 +▁gambier -2620 +▁jesberg -2621 +▁llierca -2622 +▁mataura -2623 +▁misioni -2624 +▁muthoni -2625 +▁nyerere -2626 +▁patrick -2627 +▁paturaa -2628 +▁possède -2629 +▁pureraa -2630 +▁ravehia -2631 +▁raveraa -2632 +▁raìātea -2633 +▁riroraa -2634 +▁rorofaì -2635 +▁sissala -2636 +▁taheraa -2637 +▁tairoto -2638 +▁tangata -2639 +▁tumaraa -2640 +▁tunisia -2641 +▁tūāmotu -2642 +▁village -2643 +▁website -2644 +▁âperera -2645 +▁êperara -2646 +▁šiprage -2647 +ukashenko -2648 +▁amankwah -2649 +▁arapania -2650 +▁caroline -2651 +▁category 
-2652 +▁fabaceae -2653 +▁faustina -2654 +▁françois -2655 +▁ghanaian -2656 +▁haerenga -2657 +▁haereraa -2658 +▁heheuraa -2659 +▁hollande -2660 +▁katolika -2661 +▁katorika -2662 +▁maitihia -2663 +▁maìtiraa -2664 +▁moraceae -2665 +▁otitānia -2666 +▁pangarau -2667 +▁parauhia -2668 +▁pehepehe -2669 +▁punaauia -2670 +▁rituania -2671 +▁rutaceae -2672 +▁sarajevo -2673 +▁tapotapo -2674 +▁taputapu -2675 +▁tauatini -2676 +▁titauraa -2677 +▁toromona -2678 +▁uetersen -2679 +▁wellness -2680 +▁ètārētia -2681 +▁catalunya -2682 +▁documents -2683 +▁edinburgh -2684 +▁faahiahia -2685 +▁faaotiraa -2686 +▁institute -2687 +▁makeranta -2688 +▁parahiraa -2689 +▁parururaa -2690 +▁tectorius -2691 +▁tuatapapa -2692 +▁wikimedia -2693 +▁републике -2694 +▁kilometera -2695 +▁multimédia -2696 +▁population -2697 +▁porotetani -2698 +▁présidence -2699 +▁references -2700 +▁tapihooraa -2701 +▁telenovela -2702 +▁territoria -2703 +atuaiahutapu -2704 +▁faanahonaho -2705 +▁faaohiparaa -2706 +▁pakiwaitara -2707 +▁paradisiaca -2708 +▁peritomeraa -2709 +▁philosophia -2710 +▁faaineinehia -2711 +▁haaparareraa -2712 +▁taputapuatea -2713 +▁faahanahanahia -2714 +.[ -2715 +ac -2716 +aè -2717 +bb -2718 +bá -2719 +bé -2720 +cl -2721 +cê -2722 +df -2723 +dí -2724 +dó -2725 +fé -2726 +hy -2727 +ib -2728 +ju -2729 +kp -2730 +kā -2731 +lv -2732 +mm -2733 +mw -2734 +nō -2735 +oh -2736 +pī -2737 +rt -2738 +tì -2739 +tū -2740 +uk -2741 +un -2742 +ux -2743 +vō -2744 +wī -2745 +yd -2746 +yl -2747 +yu -2748 +zh -2749 +», -2750 +ás -2751 +ên -2752 +ît -2753 +ùo -2754 +āi -2755 +či -2756 +ед -2757 +ст -2758 +عب -2759 +▁# -2760 +▁= -2761 +▁° -2762 +▁û -2763 +▁ū -2764 +▁ʼ -2765 +▁ˈ -2766 +▁а -2767 +▁д -2768 +▁е -2769 +▁з -2770 +▁и -2771 +▁й -2772 +▁л -2773 +▁н -2774 +▁ц -2775 +▁ч -2776 +▁ш -2777 +▁ы -2778 +ale -2779 +ali -2780 +alo -2781 +ani -2782 +ank -2783 +ans -2784 +apu -2785 +arā -2786 +ase -2787 +aug -2788 +aux -2789 +ava -2790 +bes -2791 +bor -2792 +cie -2793 +com -2794 +cre -2795 +cri -2796 +day -2797 +dra -2798 +dua 
-2799 +ка -2800 +▁у -2801 +bis -2802 +bua -2803 +cto -2804 +ehi -2805 +eie -2806 +eue -2807 +fer -2808 +ffe -2809 +fim -2810 +fos -2811 +fre -2812 +gie -2813 +gos -2814 +gro -2815 +gui -2816 +har -2817 +hie -2818 +hin -2819 +hot -2820 +iar -2821 +ide -2822 +ini -2823 +isu -2824 +jor -2825 +kin -2826 +koa -2827 +kos -2828 +kru -2829 +lco -2830 +lls -2831 +lly -2832 +lol -2833 +lto -2834 +láu -2835 +mad -2836 +mah -2837 +mat -2838 +mgo -2839 +mia -2840 +mie -2841 +min -2842 +mir -2843 +mni -2844 +mor -2845 +mot -2846 +mui -2847 +nen -2848 +nho -2849 +nor -2850 +nou -2851 +nti -2852 +nva -2853 +nys -2854 +oha -2855 +ols -2856 +one -2857 +ono -2858 +onu -2859 +oti -2860 +ots -2861 +ous -2862 +paa -2863 +pal -2864 +pan -2865 +pii -2866 +pon -2867 +pos -2868 +pse -2869 +ras -2870 +reu -2871 +rid -2872 +riu -2873 +rni -2874 +rés -2875 +san -2876 +sea -2877 +sha -2878 +sit -2879 +siu -2880 +ski -2881 +sto -2882 +tan -2883 +teg -2884 +thy -2885 +tic -2886 +tie -2887 +tiu -2888 +toà -2889 +toè -2890 +ttu -2891 +tue -2892 +upa -2893 +urs -2894 +ute -2895 +vau -2896 +vel -2897 +vis -2898 +wen -2899 +af -2900 +ки -2901 +▁ó -2902 +bas -2903 +elr -2904 +iso -2905 +isy -2906 +mic -2907 +moe -2908 +ndo -2909 +noa -2910 +now -2911 +rdi -2912 +the -2913 +tty -2914 +whi -2915 +yij -2916 +zen -2917 +zes -2918 +zos -2919 +ûru -2920 +āpi -2921 +āto -2922 +čes -2923 +ītā -2924 +īwī -2925 +ōna -2926 +рад -2927 +род -2928 +▁(° -2929 +▁az -2930 +▁cé -2931 +▁dá -2932 +▁dä -2933 +▁ej -2934 +▁gi -2935 +▁gl -2936 +▁gá -2937 +▁io -2938 +▁iz -2939 +▁kā -2940 +▁mé -2941 +▁od -2942 +▁oè -2943 +▁pá -2944 +▁pē -2945 +▁pī -2946 +▁sp -2947 +▁sé -2948 +▁sí -2949 +▁th -2950 +▁ty -2951 +▁uk -2952 +▁us -2953 +▁vá -2954 +▁wh -2955 +▁ze -2956 +▁». 
-2957 +▁ту -2958 +▁ال -2959 +alpi -2960 +anth -2961 +arii -2962 +bayo -2963 +bral -2964 +ccha -2965 +cial -2966 +ción -2967 +cron -2968 +date -2969 +desh -2970 +divi -2971 +eira -2972 +elli -2973 +ence -2974 +enix -2975 +eren -2976 +eres -2977 +esca -2978 +esia -2979 +esti -2980 +fano -2981 +fski -2982 +gado -2983 +goso -2984 +gual -2985 +hapa -2986 +hata -2987 +heli -2988 +hena -2989 +hera -2990 +hina -2991 +hinu -2992 +hiro -2993 +hono -2994 +hora -2995 +iaki -2996 +iana -2997 +ibge -2998 +inda -2999 +ró -3000 +.). -3001 +dol -3002 +dom -3003 +eux -3004 +iki -3005 +kum -3006 +llà -3007 +nce -3008 +rst -3009 +▁". -3010 +▁). -3011 +amra -3012 +fata -3013 +grat -3014 +inga -3015 +jany -3016 +jour -3017 +kahu -3018 +kare -3019 +kava -3020 +keok -3021 +kete -3022 +kiro -3023 +kota -3024 +kume -3025 +kura -3026 +ladi -3027 +lano -3028 +lecu -3029 +left -3030 +lesz -3031 +lien -3032 +liki -3033 +lixa -3034 +llus -3035 +lnea -3036 +lori -3037 +lska -3038 +lter -3039 +léme -3040 +mara -3041 +mato -3042 +mbra -3043 +meka -3044 +meni -3045 +mont -3046 +mote -3047 +muna -3048 +nani -3049 +nato -3050 +nava -3051 +navi -3052 +ndis -3053 +ners -3054 +nges -3055 +ngoa -3056 +ngon -3057 +niak -3058 +nini -3059 +nira -3060 +nuve -3061 +onné -3062 +oriz -3063 +orro -3064 +osco -3065 +osus -3066 +otri -3067 +otro -3068 +oute -3069 +peri -3070 +piah -3071 +pipi -3072 +pohe -3073 +pool -3074 +puri -3075 +putu -3076 +quel -3077 +quer -3078 +quil -3079 +raka -3080 +rara -3081 +reia -3082 +ries -3083 +risi -3084 +ropo -3085 +rson -3086 +ruhi -3087 +ruve -3088 +rédé -3089 +rātā -3090 +sara -3091 +sien -3092 +siti -3093 +ssen -3094 +stor -3095 +sula -3096 +szte -3097 +tade -3098 +tahu -3099 +amâ -3100 +bel -3101 +kei -3102 +ong -3103 +ron -3104 +sso -3105 +une -3106 +àau -3107 +ère -3108 +▁zu -3109 +▁на -3110 +cast -3111 +cego -3112 +cide -3113 +cies -3114 +kowa -3115 +kále -3116 +nake -3117 +rike -3118 +stro -3119 +taro -3120 +tati -3121 +ther -3122 +thri -3123 +tifo -3124 +tika -3125 
+tine -3126 +tiri -3127 +tsch -3128 +tska -3129 +tten -3130 +ttli -3131 +uaku -3132 +udad -3133 +urne -3134 +usta -3135 +uvea -3136 +uvre -3137 +vaco -3138 +vier -3139 +vila -3140 +viny -3141 +voir -3142 +vōta -3143 +wani -3144 +yama -3145 +áres -3146 +èrau -3147 +ètoè -3148 +état -3149 +être -3150 +íbal -3151 +òhia -3152 +āraì -3153 +рист -3154 +▁aau -3155 +▁abc -3156 +▁ahe -3157 +▁air -3158 +▁ake -3159 +▁ami -3160 +▁apo -3161 +▁arb -3162 +▁atâ -3163 +▁aua -3164 +▁aux -3165 +▁ben -3166 +▁beu -3167 +▁bol -3168 +▁bru -3169 +▁cam -3170 +▁cen -3171 +▁ceo -3172 +▁cla -3173 +▁die -3174 +▁din -3175 +▁dra -3176 +▁eie -3177 +▁eli -3178 +▁esz -3179 +▁fan -3180 +▁far -3181 +▁fil -3182 +▁flu -3183 +▁flá -3184 +▁fre -3185 +▁gif -3186 +▁gre -3187 +▁hea -3188 +▁hel -3189 +▁ina -3190 +▁ire -3191 +▁jus -3192 +▁kar -3193 +▁kni -3194 +▁koa -3195 +▁kom -3196 +▁kpi -3197 +▁lin -3198 +▁loi -3199 +at -3200 +ôr -3201 +bol -3202 +der -3203 +glo -3204 +ifo -3205 +luc -3206 +oko -3207 +pià -3208 +von -3209 +íso -3210 +▁fā -3211 +▁já -3212 +▁xh -3213 +▁za -3214 +aita -3215 +bird -3216 +bosa -3217 +cifo -3218 +eraa -3219 +gill -3220 +gues -3221 +káve -3222 +lder -3223 +mbre -3224 +ndão -3225 +polu -3226 +pure -3227 +pōra -3228 +rcia -3229 +rdia -3230 +rons -3231 +rump -3232 +soma -3233 +veta -3234 +ícia -3235 +▁acu -3236 +▁bio -3237 +▁los -3238 +▁lud -3239 +▁mlu -3240 +▁moe -3241 +▁myr -3242 +▁nas -3243 +▁nya -3244 +▁não -3245 +▁oba -3246 +▁oei -3247 +▁oto -3248 +▁oui -3249 +▁pad -3250 +▁pen -3251 +▁pep -3252 +▁per -3253 +▁pfi -3254 +▁pii -3255 +▁ple -3256 +▁pop -3257 +▁rei -3258 +▁res -3259 +▁roh -3260 +▁sad -3261 +▁sau -3262 +▁sci -3263 +▁sea -3264 +▁ses -3265 +▁sme -3266 +▁son -3267 +▁sti -3268 +▁sto -3269 +▁stu -3270 +▁ten -3271 +▁tom -3272 +▁toà -3273 +▁ufi -3274 +▁val -3275 +▁vea -3276 +▁vii -3277 +▁vir -3278 +▁yem -3279 +▁yes -3280 +▁zan -3281 +▁àif -3282 +▁àno -3283 +▁àti -3284 +▁âau -3285 +▁âià -3286 +▁âpī -3287 +▁ère -3288 +▁òro -3289 +▁ùru -3290 +ahotu -3291 +alofa -3292 +amana 
-3293 +ankro -3294 +apira -3295 +arava -3296 +arāau -3297 +atata -3298 +bbins -3299 +etu -3300 +jar -3301 +rià -3302 +▁ér -3303 +blic -3304 +dyta -3305 +java -3306 +lada -3307 +lité -3308 +melo -3309 +orld -3310 +phor -3311 +rapa -3312 +▁che -3313 +▁jau -3314 +▁six -3315 +▁tho -3316 +apeto -3317 +aturi -3318 +brega -3319 +casia -3320 +ching -3321 +chyum -3322 +ciano -3323 +colum -3324 +conia -3325 +crest -3326 +curma -3327 +deval -3328 +dinha -3329 +dulus -3330 +dísti -3331 +ehara -3332 +entum -3333 +féren -3334 +gegie -3335 +geria -3336 +gifer -3337 +gique -3338 +guaya -3339 +hangi -3340 +hação -3341 +hetia -3342 +hiata -3343 +hibis -3344 +hiraa -3345 +iland -3346 +illes -3347 +imira -3348 +inapo -3349 +irani -3350 +itihi -3351 +iātea -3352 +kehau -3353 +lcomb -3354 +leurs -3355 +llets -3356 +marie -3357 +mores -3358 +moteo -3359 +muaki -3360 +naldo -3361 +nells -3362 +nellà -3363 +nesco -3364 +nford -3365 +niara -3366 +nilla -3367 +niota -3368 +nshin -3369 +ntiif -3370 +nuraa -3371 +oragi -3372 +orata -3373 +ordor -3374 +oreau -3375 +orges -3376 +orpho -3377 +oscou -3378 +petit -3379 +piria -3380 +pital -3381 +publi -3382 +pāpaì -3383 +quise -3384 +rican -3385 +riket -3386 +riona -3387 +rothe -3388 +runga -3389 +silia -3390 +steur -3391 +story -3392 +sulté -3393 +tahaa -3394 +taima -3395 +taito -3396 +talum -3397 +tangi -3398 +teate -3399 +tilis -3400 +tinia -3401 +tonia -3402 +tráti -3403 +tuhaa -3404 +tumor -3405 +tures -3406 +uador -3407 +ubaix -3408 +univa -3409 +uraro -3410 +ution -3411 +vador -3412 +veira -3413 +verne -3414 +vesen -3415 +wanga -3416 +wango -3417 +yline -3418 +zalez -3419 +zerba -3420 +zosta -3421 +çanet -3422 +ïaraa -3423 +ānani -3424 +родна -3425 +▁achi -3426 +▁aito -3427 +▁aora -3428 +▁ashe -3429 +▁asia -3430 +▁aura -3431 +▁azin -3432 +▁baku -3433 +▁basi -3434 +▁boui -3435 +▁burt -3436 +▁caba -3437 +▁camb -3438 +▁camp -3439 +▁cara -3440 +▁city -3441 +▁cláu -3442 +▁cora -3443 +▁cour -3444 +▁cuba -3445 +▁curi -3446 +▁data -3447 +▁disz -3448 
+▁domi -3449 +▁duck -3450 +▁duma -3451 +▁eaha -3452 +▁espo -3453 +▁esta -3454 +▁fine -3455 +▁flav -3456 +▁from -3457 +▁heli -3458 +▁hitu -3459 +▁hune -3460 +▁iyol -3461 +▁joan -3462 +▁kaha -3463 +▁kpaa -3464 +▁land -3465 +▁lehn -3466 +▁lins -3467 +▁lisa -3468 +▁lond -3469 +▁luiz -3470 +▁mama -3471 +▁mary -3472 +▁mati -3473 +▁meka -3474 +▁mena -3475 +▁miro -3476 +▁moli -3477 +▁mona -3478 +▁moru -3479 +▁moto -3480 +▁muni -3481 +▁name -3482 +▁nano -3483 +▁natī -3484 +▁nava -3485 +▁news -3486 +▁niau -3487 +▁niuē -3488 +▁nkru -3489 +▁noaa -3490 +▁nono -3491 +▁nuci -3492 +▁ohie -3493 +▁omua -3494 +▁oteg -3495 +▁otia -3496 +▁pala -3497 +▁papu -3498 +▁pati -3499 +▁patr -3500 +▁pene -3501 +▁pont -3502 +▁porī -3503 +▁poti -3504 +▁poto -3505 +▁pour -3506 +▁pres -3507 +▁prot -3508 +▁puig -3509 +▁reis -3510 +▁rien -3511 +▁riud -3512 +▁roll -3513 +▁ropu -3514 +▁rose -3515 +▁ruby -3516 +▁rōpū -3517 +▁sala -3518 +▁sali -3519 +▁sera -3520 +▁sert -3521 +▁seus -3522 +▁sine -3523 +▁snow -3524 +▁sola -3525 +▁suis -3526 +▁sule -3527 +▁surf -3528 +▁taro -3529 +▁teko -3530 +▁teme -3531 +▁tepa -3532 +▁tepo -3533 +▁teve -3534 +▁titi -3535 +▁toau -3536 +▁toka -3537 +▁tonu -3538 +▁tuhe -3539 +▁tuhu -3540 +▁tura -3541 +▁tutu -3542 +▁tōna -3543 +▁uira -3544 +▁vall -3545 +▁vana -3546 +▁vera -3547 +▁você -3548 +▁vāna -3549 +▁with -3550 +▁wīwī -3551 +▁âamu -3552 +▁âmui -3553 +▁îraa -3554 +africa -3555 +aifiti -3556 +amâraa -3557 +apiira -3558 +ataata -3559 +atuhia -3560 +cation -3561 +celona -3562 +center -3563 +chiman -3564 +donald -3565 +edirne -3566 +fauraa -3567 +fortia -3568 +gentea -3569 +heretō -3570 +hostal -3571 +huinga -3572 +hīmene -3573 +iriraa -3574 +ivavao -3575 +kareka -3576 +kuláre -3577 +llyday -3578 +lémena -3579 +marama -3580 +minist -3581 +misina -3582 +nglish -3583 +ngonui -3584 +numiti -3585 +nuvera -3586 +oniifo -3587 +prache -3588 +ribati -3589 +roella -3590 +ruhito -3591 +sident -3592 +silien -3593 +spesia -3594 +sticum -3595 +sulare -3596 +sypium -3597 +tepipi -3598 
+terani -3599 +ticosa -3600 +tārava -3601 +urites -3602 +urunga -3603 +vatska -3604 +waiata -3605 +ìteraa -3606 +ристич -3607 +▁actua -3608 +▁adaku -3609 +▁adela -3610 +▁alata -3611 +▁alice -3612 +▁alpha -3613 +▁amanu -3614 +▁amaru -3615 +▁angli -3616 +▁arabi -3617 +▁aroha -3618 +▁auraa -3619 +▁award -3620 +▁betty -3621 +▁bisiw -3622 +▁blues -3623 +▁boute -3624 +▁bowen -3625 +▁brest -3626 +▁cassà -3627 +▁citri -3628 +▁commi -3629 +▁daily -3630 +▁daisy -3631 +▁denis -3632 +▁eesti -3633 +▁ejisu -3634 +▁etoni -3635 +▁faaau -3636 +▁faaru -3637 +▁faati -3638 +▁faith -3639 +▁falab -3640 +▁ferra -3641 +▁ferri -3642 +▁fetia -3643 +▁fetià -3644 +▁first -3645 +▁flori -3646 +▁franc -3647 +▁frédé -3648 +▁fānau -3649 +▁gusta -3650 +▁haamo -3651 +▁hanga -3652 +▁henen -3653 +▁henri -3654 +▁hiroà -3655 +▁huaai -3656 +▁hōreo -3657 +▁idade -3658 +▁igual -3659 +▁infos -3660 +▁ingoa -3661 +▁julià -3662 +▁jurei -3663 +▁kairo -3664 +▁katiu -3665 +▁komfo -3666 +▁konge -3667 +▁kwame -3668 +▁kwase -3669 +▁leone -3670 +▁liver -3671 +▁longa -3672 +▁lídia -3673 +▁manar -3674 +▁manui -3675 +▁mello -3676 +▁merci -3677 +▁methy -3678 +▁moluc -3679 +▁monte -3680 +▁mount -3681 +▁musée -3682 +▁names -3683 +▁negro -3684 +▁nenei -3685 +▁nepal -3686 +▁nephi -3687 +▁noreg -3688 +▁nyáze -3689 +▁opani -3690 +▁panda -3691 +▁papaa -3692 +▁parti -3693 +▁perez -3694 +▁photo -3695 +▁plaît -3696 +▁popaa -3697 +▁pouri -3698 +▁prado -3699 +▁premi -3700 +▁priva -3701 +▁puoro -3702 +▁pwani -3703 +▁pāpua -3704 +▁ratio -3705 +▁raveā -3706 +▁rocha -3707 +▁rodri -3708 +▁rosto -3709 +▁rātou -3710 +▁sabia -3711 +▁sagit -3712 +▁seven -3713 +▁silva -3714 +▁solia -3715 +▁souff -3716 +▁souza -3717 +▁staat -3718 +▁taato -3719 +▁taero -3720 +▁taite -3721 +▁tamaì -3722 +▁tapea -3723 +▁taruā -3724 +▁taure -3725 +▁teioa -3726 +▁temoe -3727 +▁temps -3728 +▁terai -3729 +▁tikei -3730 +▁tiwhi -3731 +▁toroa -3732 +▁trump -3733 +▁tuaro -3734 +▁tuite -3735 +▁tychy -3736 +▁uttar -3737 +▁vavai -3738 +▁visit -3739 +▁vladi -3740 +▁whana 
-3741 +▁world -3742 +▁àhuru -3743 +▁ânani -3744 +▁ènana -3745 +ahotura -3746 +alpinia -3747 +ccharum -3748 +cepción -3749 +ciparum -3750 +dytarum -3751 +dística -3752 +fritsch -3753 +heretue -3754 +kávetrá -3755 +manihia -3756 +minalia -3757 +navichy -3758 +ndaceae -3759 +ngifera -3760 +paraiso -3761 +paraíso -3762 +phallus -3763 +psidium -3764 +queline -3765 +ristina -3766 +ruvetia -3767 +stiques -3768 +tallada -3769 +taronia -3770 +tetiano -3771 +thosoma -3772 +tifolia -3773 +titohia -3774 +tsoreau -3775 +ttlikon -3776 +āitoraa -3777 +ōperera -3778 +▁aguiar -3779 +▁ahakoa -3780 +▁ahunui -3781 +▁akanva -3782 +▁akiaki -3783 +▁albert -3784 +▁anavai -3785 +▁andreu -3786 +▁anuanu -3787 +▁aníbal -3788 +▁aparau -3789 +▁apatoà -3790 +▁appiah -3791 +▁arorau -3792 +▁asante -3793 +▁ateate -3794 +▁azerba -3795 +▁baskin -3796 +▁batata -3797 +▁boragi -3798 +▁brasil -3799 +▁brésil -3800 +▁carlos -3801 +▁castro -3802 +▁cavaco -3803 +▁cidade -3804 +▁compan -3805 +▁decide -3806 +▁dentro -3807 +▁dordor -3808 +▁edulis -3809 +▁elaine -3810 +▁eliana -3811 +▁eliane -3812 +▁equise -3813 +▁ereraa -3814 +▁esteve -3815 +▁eunice -3816 +▁euphor -3817 +▁faatià -3818 +▁faaàhā -3819 +▁faaàpu -3820 +▁faaûru -3821 +▁farara -3822 +▁fatata -3823 +▁fluvià -3824 +▁flávio -3825 +▁france -3826 +▁haerea -3827 +▁henryk -3828 +▁herbal -3829 +▁hetero -3830 +▁howell -3831 +▁hīmeni -3832 +▁imiraa -3833 +▁itehia -3834 +▁jacqui -3835 +▁johnny -3836 +▁kauehi -3837 +▁kouaku -3838 +▁louvre -3839 +▁macron -3840 +▁manuïa -3841 +▁maraga -3842 +▁marcel -3843 +▁mature -3844 +▁mcgill -3845 +▁mekiro -3846 +▁merger -3847 +▁metera -3848 +▁miquel -3849 +▁mokowa -3850 +▁molecu -3851 +▁mollet -3852 +▁morane -3853 +▁moroni -3854 +▁moscou -3855 +▁márcia -3856 +▁mānava -3857 +▁nihiru -3858 +▁niuhia -3859 +▁nohora -3860 +▁nūmera -3861 +▁parani -3862 +▁paraoa -3863 +▁parisi -3864 +▁peehia -3865 +▁petero -3866 +▁pfizer -3867 +▁philip -3868 +▁pinaki -3869 +▁please -3870 +▁polska -3871 +▁polyne -3872 +▁portal -3873 +▁porter -3874 
+▁rahira -3875 +▁raraka -3876 +▁raroia -3877 +▁ratere -3878 +▁riveta -3879 +▁roaraa -3880 +▁roszte -3881 +▁rēmuna -3882 +▁sahara -3883 +▁sandra -3884 +▁school -3885 +▁sierra -3886 +▁sombra -3887 +▁taenga -3888 +▁taiaro -3889 +▁takume -3890 +▁tamanu -3891 +▁tarahu -3892 +▁tauere -3893 +▁tauraa -3894 +▁taviri -3895 +▁taòhia -3896 +▁tearii -3897 +▁teatea -3898 +▁tekava -3899 +▁terera -3900 +▁thanks -3901 +▁tiaàau -3902 +▁tigers -3903 +▁tinito -3904 +▁tiàraa -3905 +▁tourne -3906 +▁toètoè -3907 +▁troglo -3908 +▁turiti -3909 +▁tuvalu -3910 +▁tāfano -3911 +▁tāhinu -3912 +▁tāporo -3913 +▁ubuntu -3914 +▁unesco -3915 +▁victor -3916 +▁vilada -3917 +▁vilama -3918 +▁whanga -3919 +▁whanui -3920 +▁whenua -3921 +▁wilson -3922 +▁yuniva -3923 +▁ànotau -3924 +▁àuhune -3925 +▁āmenia -3926 +atuahiva -3927 +aturiraa -3928 +cifolium -3929 +division -3930 +férences -3931 +gardenia -3932 +hibiscus -3933 +national -3934 +ografski -3935 +ographie -3936 +otropium -3937 +pandanus -3938 +parauraa -3939 +publique -3940 +pāpaìraa -3941 +tatihata -3942 +tifolium -3943 +whakaari -3944 +▁abankro -3945 +▁akamaru -3946 +▁altilis -3947 +▁amerika -3948 +▁angeles -3949 +▁antigen -3950 +▁antonio -3951 +▁antônio -3952 +▁anuvera -3953 +▁apataki -3954 +▁arairaa -3955 +▁aratika -3956 +▁atamira -3957 +▁atuaraa -3958 +▁barbosa -3959 +▁brandão -3960 +▁castell -3961 +▁casuari -3962 +▁catappa -3963 +▁comosus -3964 +▁corinne -3965 +▁cucurma -3966 +▁ecuador -3967 +▁english -3968 +▁faahapa -3969 +▁faahiti -3970 +▁faahoho -3971 +▁faatoro -3972 +▁faatumu -3973 +▁fagifer -3974 +▁fareata -3975 +▁fernand -3976 +▁fragoso -3977 +▁frogier -3978 +▁gregory -3979 +▁guajava -3980 +▁hanshin -3981 +▁haraiki -3982 +▁hercego -3983 +▁holcomb -3984 +▁hunaraa -3985 +▁hurihia -3986 +▁incanus -3987 +▁islands -3988 +▁jackson -3989 +▁kaukura -3990 +▁kawango -3991 +▁kingdom -3992 +▁kohinga -3993 +▁leticia -3994 +▁llémena -3995 +▁makaroa -3996 +▁makatea -3997 +▁malgrat -3998 +▁marokau -3999 +▁mataiva -4000 +▁maçanet -4001 +▁medical -4002 
+▁miranda -4003 +▁miriona -4004 +▁moruroa -4005 +▁māniota -4006 +▁nigeria -4007 +▁nkrumah -4008 +▁nohoraa -4009 +▁odorata -4010 +▁omuaraa -4011 +▁orohena -4012 +▁orvesen -4013 +▁painapo -4014 +▁pasteur -4015 +▁pipiria -4016 +▁poheraa -4017 +▁polanyi -4018 +▁poszter -4019 +▁pradesh -4020 +▁project -4021 +▁prolixa -4022 +▁puarātā -4023 +▁pukarua -4024 +▁pētānia -4025 +▁pōtinia -4026 +▁raitihi -4027 +▁rapaeau -4028 +▁reitoru -4029 +▁rikitea -4030 +▁ronaldo -4031 +▁roubaix -4032 +▁sanquer -4033 +▁science -4034 +▁serafim -4035 +▁sotelli -4036 +▁tahanea -4037 +▁taioraa -4038 +▁tatuhaa -4039 +▁tauihaa -4040 +▁tehetia -4041 +▁teienei -4042 +▁tikanga -4043 +▁tikehau -4044 +▁timoteo -4045 +▁trojany -4046 +▁tuanake -4047 +▁tumuaki -4048 +▁vahanga -4049 +▁verrons -4050 +▁vontade -4051 +▁whakapu -4052 +▁àhuāraì -4053 +▁êperēra -4054 +▁народна -4055 +chimantia -4056 +guayaquil -4057 +hostalnou -4058 +montblanc -4059 +niuterani -4060 +ntiifolia -4061 +raromataì -4062 +ringtonia -4063 +taimareva -4064 +toronetia -4065 +vernement -4066 +▁achimota -4067 +▁adelaide -4068 +▁american -4069 +▁anglican -4070 +▁argentea -4071 +▁asiatica -4072 +▁basileia -4073 +▁bouissou -4074 +▁brasilia -4075 +▁consulté -4076 +▁cristina -4077 +▁dominiak -4078 +▁faafanau -4079 +▁fakahina -4080 +▁frédéric -4081 +▁gonzalez -4082 +▁hallyday -4083 +▁hangarau -4084 +▁hospital -4085 +▁illinois -4086 +▁insulare -4087 +▁kenyatta -4088 +▁komisina -4089 +▁malhação -4090 +▁manahune -4091 +▁manutahi -4092 +▁marotiri -4093 +▁maupihaa -4094 +▁mcdonald -4095 +▁mekameka -4096 +▁melekeok -4097 +▁military -4098 +▁mātiharo -4099 +▁māuruuru -4100 +▁nanumiti -4101 +▁naruhito -4102 +▁natīrara -4103 +▁nucifera -4104 +▁nászopki -4105 +▁oeillets -4106 +▁oliveira -4107 +▁otegbayo -4108 +▁patireia -4109 +▁patrícia -4110 +▁peralada -4111 +▁peretita -4112 +▁populnea -4113 +▁profesôr -4114 +▁pātifita -4115 +▁pātifitā -4116 +▁raparapa -4117 +▁ravahere -4118 +▁rekareka -4119 +▁research -4120 +▁rohipehe -4121 +▁rongonui -4122 +▁salvador 
-4123 +▁sinensis -4124 +▁snowbird -4125 +▁speciosa -4126 +▁stanford -4127 +▁sulemana -4128 +▁takapoto -4129 +▁taratara -4130 +▁tarutaru -4131 +▁teaching -4132 +▁tekokota -4133 +▁temeharo -4134 +▁tenararo -4135 +▁tepapuri -4136 +▁thailand -4137 +▁tiribati -4138 +▁titauhia -4139 +▁toroātia -4140 +▁tourisme -4141 +▁vaataata -4142 +▁vahitahi -4143 +▁vanavana -4144 +▁ventures -4145 +▁vladimir -4146 +▁wellcome -4147 +▁whakaaro -4148 +▁whakanui -4149 +▁òrometua -4150 +▁туристич -4151 +artocarpus -4152 +christophe -4153 +heretōvina -4154 +ographical -4155 +oniifolius -4156 +zostachyum -4157 +▁actualité -4158 +▁aleksandr -4159 +▁alexandre -4160 +▁americana -4161 +▁animation -4162 +▁antitumor -4163 +▁apatoèrau -4164 +▁azinheira -4165 +▁brésilien -4166 +▁csebászti -4167 +▁dioscorea -4168 +▁dättlikon -4169 +▁faaoraraa -4170 +▁faataahia -4171 +▁faataaraa -4172 +▁faaìteraa -4173 +▁falabella -4174 +▁feruriraa -4175 +▁fruticosa -4176 +▁haamaitai -4177 +▁heremoana -4178 +▁huitārava -4179 +▁hāmanihia -4180 +▁igualdade -4181 +▁kaiwaiata -4182 +▁lancaster -4183 +▁lancastro -4184 +▁liverpool -4185 +▁manuhangi -4186 +▁manuïaraa -4187 +▁motutunga -4188 +▁myrtaceae -4189 +▁noruvetia -4190 +▁parataito -4191 +▁porinetia -4192 +▁porīnetia -4193 +▁president -4194 +▁priscille -4195 +▁republika -4196 +▁sapientum -4197 +▁taitensis -4198 +▁tamataraa -4199 +▁taraehara -4200 +▁tematangi -4201 +▁tenarunga -4202 +▁tetaronia -4203 +▁tiwhikete -4204 +▁torinetia -4205 +▁torroella -4206 +▁totegegie -4207 +▁vairaatea -4208 +▁anuanuraro -4209 +▁asantehene -4210 +▁citrifolia -4211 +▁concepción -4212 +▁faaterehau -4213 +▁faatupuhia -4214 +▁falciparum -4215 +▁fangataufa -4216 +▁floridulus -4217 +▁fédération -4218 +▁géographie -4219 +▁haamataraa -4220 +▁inophyllum -4221 +▁jacqueline -4222 +▁kongeriket -4223 +▁lukashenko -4224 +▁matauranga -4225 +▁mohiotanga -4226 +▁mountcrest -4227 +▁nukutepipi -4228 +▁officinale -4229 +▁rohfritsch -4230 +▁références -4231 +▁république -4232 +▁solanaceae -4233 +▁tirometera 
-4234 +▁université -4235 +▁valparaíso -4236 +▁whakamahia -4237 +▁whakamaori -4238 +▁yunivasiti -4239 +▁àifāitoraa -4240 +devalparaiso -4241 +orphophallus -4242 +▁anuanurunga -4243 +▁baranavichy -4244 +▁companheira -4245 +▁haamauruuru -4246 +▁hereheretue -4247 +▁kaiwhakaari -4248 +▁methysticum -4249 +▁officinarum -4250 +▁pandanaceae -4251 +▁papetitohia -4252 +▁sapindaceae -4253 +▁statistique -4254 +▁techimantia -4255 +▁teritetiano -4256 +▁touristique -4257 +▁whakaatuhia -4258 +▁boraginaceae -4259 +▁geographical -4260 +▁glaucifolium -4261 +▁gouvernement -4262 +▁informations -4263 +▁matatatihata -4264 +▁matureivavao -4265 +▁tauaparauraa -4266 +▁territoriale -4267 +▁tournefortia -4268 +▁aurantiifolia -4269 +▁equisetifolia -4270 +▁euphorbiaceae -4271 +▁international -4272 +▁nászopkávetrá -4273 +▁paeoniifolius -4274 +▁sagittifolium -4275 +▁troglodytarum -4276 +▁faanahonahoraa -4277 +.[] -4278 +cdf -4279 +juï -4280 +mcm -4281 +nçà -4282 +ród -4283 +vāi -4284 +wee -4285 +why -4286 +yip -4287 +ziz -4288 +zzi -4289 +čić -4290 +ани -4291 +вни -4292 +едн -4293 +ени -4294 +лад -4295 +нка -4296 +▁ -6707 +cor -6708 +lij -6709 +pao -6710 +taa -6711 +▁jk -6712 +bcor -6713 +othè -6714 +urac -6715 +yves -6716 +▁der -6717 +▁emi -6718 +▁haè -6719 +▁nii -6720 +▁teu -6721 +▁vol -6722 +aaamu -6723 +rissa -6724 +tiale -6725 +trosi -6726 +ttare -6727 +verde -6728 +▁andr -6729 +▁août -6730 +▁fiti -6731 +▁ihoa -6732 +▁kadu -6733 +▁pays -6734 +▁petr -6735 +▁regi -6736 +▁rico -6737 +▁tīaì -6738 +bcorda -6739 +▁biden -6740 +▁eurac -6741 +▁ferre -6742 +▁flaçà -6743 +▁mutaa -6744 +▁málij -6745 +▁neuro -6746 +▁opbri -6747 +▁samoa -6748 +▁taoto -6749 +▁tapaò -6750 +▁tiaki -6751 +▁volta -6752 +bliothè -6753 +metrosi -6754 +otiteat -6755 +patiale -6756 +saverde -6757 +▁andrze -6758 +▁droite -6759 +▁emilin -6760 +▁geneva -6761 +▁kiloni -6762 +▁regina -6763 +▁sergio -6764 +▁solius -6765 +▁sílvio -6766 +▁vilana -6767 +averrhoa -6768 +bcordata -6769 +briciano -6770 +capsicum -6771 +chnitzel -6772 
+collecti -6773 +commissa -6774 +cskumáre -6775 +ctionary -6776 +ductions -6777 +ellement -6778 +empúries -6779 +gasriika -6780 +gholough -6781 +glicério -6782 +gueiredo -6783 +hinensis -6784 +hocolate -6785 +hostoles -6786 +hrvatska -6787 +huatanga -6788 +huirecen -6789 +illinois -6790 +isztorul -6791 +ivotriko -6792 +licsárij -6793 +llastret -6794 +llobrega -6795 +légation -6796 +makitaki -6797 +matauhia -6798 +matology -6799 +)" -6800 +io -6801 +pt -6802 +pî -6803 +äc -6804 +end -6805 +eri -6806 +iaa -6807 +née -6808 +ynt -6809 +▁av -6810 +▁mk -6811 +dame -6812 +gram -6813 +nomi -6814 +quei -6815 +uang -6816 +ēera -6817 +▁(). -6818 +▁ito -6819 +▁may -6820 +▁pur -6821 +▁päc -6822 +▁teo -6823 +▁via -6824 +ciali -6825 +criti -6826 +elend -6827 +gizes -6828 +iaame -6829 +ruant -6830 +zania -6831 +▁avri -6832 +▁cale -6833 +▁cynt -6834 +▁oslo -6835 +▁prus -6836 +▁sept -6837 +▁viab -6838 +critic -6839 +gramme -6840 +liquei -6841 +nzania -6842 +▁arara -6843 +▁avril -6844 +▁hawai -6845 +▁huita -6846 +▁isabe -6847 +▁juang -6848 +▁kainu -6849 +▁mayer -6850 +▁tator -6851 +▁teeri -6852 +▁whiti -6853 +▁ûmara -6854 +perēera -6855 +rágizes -6856 +русский -6857 +▁bruant -6858 +▁faaapî -6859 +▁faatia -6860 +▁itoito -6861 +▁kelend -6862 +▁mataio -6863 +▁planes -6864 +▁tamata -6865 +▁tāhiti -6866 +boliquei -6867 +cialiste -6868 +mination -6869 +minister -6870 +miquelon -6871 +mnigueij -6872 +mothrace -6873 +nicskijá -6874 +nikultri -6875 +niàmataì -6876 +nulaceae -6877 +nyászkij -6878 +nyávnyio -6879 +olingare -6880 +ordyline -6881 +orithmic -6882 +orofenua -6883 +oshihide -6884 +peraceae -6885 +plumeria -6886 +polukáre -6887 +poláresz -6888 +pupirīta -6889 +putuputu -6890 +rahovice -6891 +ravaìraa -6892 +rdcastle -6893 +ringfire -6894 +santalum -6895 +scanthus -6896 +sshunter -6897 +sterving -6898 +tacritic -6899 +', -6900 +ык -6901 +ruï -6902 +uti -6903 +зык -6904 +▁cí -6905 +▁fâ -6906 +▁kô -6907 +dria -6908 +fatu -6909 +riva -6910 +tagu -6911 +úcia -6912 +▁mia -6913 +barça -6914 
+nenga -6915 +petri -6916 +tagut -6917 +▁arui -6918 +▁cama -6919 +▁care -6920 +▁cruï -6921 +▁huit -6922 +▁lana -6923 +▁nice -6924 +▁terā -6925 +▁vaha -6926 +▁язык -6927 +mihere -6928 +▁abbas -6929 +▁desti -6930 +▁ihipa -6931 +▁lúcia -6932 +▁miami -6933 +▁north -6934 +▁papal -6935 +▁vaiho -6936 +▁wilma -6937 +amihere -6938 +earchga -6939 +iteiraa -6940 +morinda -6941 +nengaro -6942 +▁antoni -6943 +▁career -6944 +▁cínira -6945 +▁mafatu -6946 +▁marcos -6947 +▁māiata -6948 +▁sprint -6949 +liminisz -6950 +orizonte -6951 +tanilles -6952 +tauatini -6953 +teronomi -6954 +thriller -6955 +tificial -6956 +tinanata -6957 +triváles -6958 +ttarella -6959 +uanatura -6960 +ulpellac -6961 +valevska -6962 +warszawa -6963 +whakaaro -6964 +zingiber -6965 +zinyenko -6966 +ūmatatea -6967 +купштина -6968 +▁aahiata -6969 +▁abiodun -6970 +▁adakudu -6971 +▁adakugu -6972 +▁adukwei -6973 +▁afareai -6974 +▁african -6975 +▁agyekum -6976 +▁airport -6977 +▁alberto -6978 +▁algiers -6979 +▁andrzej -6980 +▁anglais -6981 +▁anthony -6982 +▁antoine -6983 +▁antônia -6984 +▁asheley -6985 +▁asiedua -6986 +▁ataahua -6987 +▁avenida -6988 +▁balance -6989 +▁bapetiz -6990 +▁beijing -6991 +▁belango -6992 +▁berisha -6993 +▁bertaèy -6994 +▁bertero -6995 +▁bescanó -6996 +▁biology -6997 +▁boldrin -6998 +▁bollers -6999 +): -7000 +cn -7001 +tm -7002 +ân -7003 +low -7004 +sân -7005 +tep -7006 +óes -7007 +▁im -7008 +▁òc -7009 +cnrs -7010 +elus -7011 +itaā -7012 +nere -7013 +otti -7014 +tape -7015 +▁bih -7016 +▁rég -7017 +▁toa -7018 +festo -7019 +llero -7020 +numia -7021 +otted -7022 +raamu -7023 +urite -7024 +▁back -7025 +▁góes -7026 +▁haro -7027 +▁have -7028 +▁hōpe -7029 +▁iter -7030 +▁koti -7031 +▁lipo -7032 +▁ophi -7033 +▁rāua -7034 +▁tant -7035 +▁tihi -7036 +cotted -7037 +mautia -7038 +rsotti -7039 +scelus -7040 +▁agora -7041 +▁arena -7042 +▁lília -7043 +▁mario -7044 +▁moscà -7045 +▁mouta -7046 +▁nūnaa -7047 +▁régis -7048 +▁taere -7049 +▁temau -7050 +▁terii -7051 +▁tetep -7052 +itaāria -7053 +liaceus -7054 +llerols 
-7055 +nifolia -7056 +taurite -7057 +ututaru -7058 +ycotted -7059 +▁amanda -7060 +▁backpa -7061 +▁duarte -7062 +▁fortià -7063 +▁huinga -7064 +▁hānere -7065 +▁konohe -7066 +▁ludlow -7067 +▁lílian -7068 +▁miscan -7069 +▁poland -7070 +▁sobral -7071 +▁tantra -7072 +▁tarawa -7073 +▁tuuraa -7074 +csimnáze -7075 +ministry -7076 +tnership -7077 +vinyenko -7078 +▁bonjorn -7079 +▁bonjour -7080 +▁bonmatí -7081 +▁bordils -7082 +▁buzsnyá -7083 +▁cabanes -7084 +▁cainito -7085 +▁calella -7086 +▁calophy -7087 +▁camalle -7088 +▁camargo -7089 +▁camozzi -7090 +▁cananga -7091 +▁capmany -7092 +▁cassini -7093 +▁cellera -7094 +▁cheveux -7095 +▁chicago -7096 +▁christi -7097 +▁cimángo -7098 +▁climent -7099 +") -7100 +hoe -7101 +jta -7102 +nux -7103 +ram -7104 +rao -7105 +vil -7106 +▁ip -7107 +▁it -7108 +▁tv -7109 +▁tx -7110 +▁tô -7111 +chel -7112 +chno -7113 +rema -7114 +veià -7115 +▁eiâ -7116 +▁ene -7117 +▁lec -7118 +▁mum -7119 +▁ult -7120 +hawai -7121 +jtari -7122 +leana -7123 +miere -7124 +narao -7125 +ohsiu -7126 +▁dans -7127 +▁gona -7128 +▁mose -7129 +▁musi -7130 +▁paru -7131 +▁waia -7132 +▁yara -7133 +ramort -7134 +tirara -7135 +ubuntu -7136 +▁auter -7137 +▁civil -7138 +▁enemi -7139 +▁etoto -7140 +▁linux -7141 +▁láves -7142 +▁maior -7143 +▁pavel -7144 +▁publi -7145 +▁rudol -7146 +▁tôvon -7147 +▁àveià -7148 +jtarija -7149 +nanahia -7150 +ohsiung -7151 +èperēra -7152 +▁joelle -7153 +▁jurema -7154 +▁lectin -7155 +▁manage -7156 +▁michel -7157 +▁mumura -7158 +▁parupa -7159 +▁platja -7160 +▁publie -7161 +▁rudolf -7162 +▁tavana -7163 +▁techno -7164 +▁tuaiva -7165 +▁србију -7166 +pflocher -7167 +ukairani -7168 +vanadate -7169 +▁cláudia -7170 +▁cláudio -7171 +▁college -7172 +▁commise -7173 +▁contour -7174 +▁coronel -7175 +▁crespià -7176 +▁császte -7177 +▁cynthia -7178 +▁daniela -7179 +▁darnius -7180 +▁delgado -7181 +▁dentist -7182 +▁despuig -7183 +▁details -7184 +▁diszkor -7185 +▁disznyu -7186 +▁drollet -7187 +▁dutronc -7188 +▁dámángo -7189 +▁edralin -7190 +▁emperor -7191 +▁engraça -7192 
+▁escrava -7193 +▁escrito -7194 +▁espolla -7195 +▁esquina -7196 +▁essenti -7197 +▁etiopia -7198 +▁eudósia -7199 +eta -7200 +gel -7201 +hen -7202 +hgh -7203 +mij -7204 +ure -7205 +vić -7206 +▁ex -7207 +▁fc -7208 +▁fī -7209 +▁gy -7210 +▁xi -7211 +hiri -7212 +mily -7213 +mmij -7214 +ngel -7215 +ouma -7216 +rdis -7217 +reta -7218 +teen -7219 +then -7220 +vedo -7221 +▁eda -7222 +▁maō -7223 +▁rid -7224 +▁zsá -7225 +▁âte -7226 +ersti -7227 +pardi -7228 +▁angi -7229 +▁find -7230 +▁fītī -7231 +▁hali -7232 +▁jord -7233 +▁kibi -7234 +▁maes -7235 +▁riel -7236 +▁tito -7237 +▁tole -7238 +▁vasc -7239 +etabli -7240 +gelian -7241 +ollina -7242 +ródmie -7243 +tringa -7244 +zevedo -7245 +▁biure -7246 +▁cohen -7247 +▁corçà -7248 +▁douma -7249 +▁exter -7250 +▁hītoa -7251 +▁janei -7252 +▁lasso -7253 +▁milla -7254 +▁ordis -7255 +▁ridge -7256 +▁tossa -7257 +▁ôhiri -7258 +teensis -7259 +trommij -7260 +▁angitu -7261 +▁family -7262 +▁halifa -7263 +▁jordan -7264 +▁kibing -7265 +▁loreta -7266 +▁matani -7267 +▁moihaa -7268 +▁puurau -7269 +▁rangel -7270 +▁riells -7271 +▁temple -7272 +▁toleza -7273 +▁utahia -7274 +pardines -7275 +stigador -7276 +tīaniani -7277 +▁albanyà -7278 +▁azevedo -7279 +▁collina -7280 +▁eulàlia -7281 +▁faahere -7282 +▁faaueue -7283 +▁faaèraa -7284 +▁faimano -7285 +▁faraāni -7286 +▁farners -7287 +▁faufaai -7288 +▁febuare -7289 +▁feridos -7290 +▁ferrari -7291 +▁ferrite -7292 +▁foerthe -7293 +▁fonteta -7294 +▁francis -7295 +▁frutesc -7296 +▁fédéral -7297 +▁galenon -7298 +▁gateway -7299 +.' 
-7300 +éc -7301 +dak -7302 +epa -7303 +law -7304 +ndc -7305 +▁ah -7306 +▁ov -7307 +▁rs -7308 +▁sw -7309 +anaí -7310 +llar -7311 +scha -7312 +ório -7313 +▁ika -7314 +▁iot -7315 +▁māt -7316 +▁ngo -7317 +▁nov -7318 +▁pdf -7319 +▁tāà -7320 +▁xan -7321 +riana -7322 +rudak -7323 +écrit -7324 +▁chan -7325 +▁cole -7326 +▁paho -7327 +▁pedy -7328 +▁purū -7329 +▁swis -7330 +▁yare -7331 +anaína -7332 +hereta -7333 +kivále -7334 +lawton -7335 +maggio -7336 +pelkan -7337 +sienne -7338 +tīteni -7339 +▁frank -7340 +▁hamoa -7341 +▁iotua -7342 +▁overe -7343 +▁porte -7344 +▁swiss -7345 +▁turau -7346 +▁tāàmu -7347 +▁yaren -7348 +cananga -7349 +mutunga -7350 +océanie -7351 +▁colera -7352 +▁huntly -7353 +▁osório -7354 +▁purūmu -7355 +▁raroto -7356 +▁tūpoto -7357 +cecropia -7358 +csimonká -7359 +fanauhia -7360 +▁adriana -7361 +▁bàscara -7362 +▁chantal -7363 +▁gbentie -7364 +▁georges -7365 +▁giacomo -7366 +▁gilbert -7367 +▁gitanas -7368 +▁glasgow -7369 +▁golding -7370 +▁gominsk -7371 +▁goodybe -7372 +▁goulart -7373 +▁grandis -7374 +▁gregori -7375 +▁grányiz -7376 +▁guarnie -7377 +▁gugliel -7378 +▁guiller -7379 +▁guiomar -7380 +▁gustavo -7381 +▁guíxols -7382 +▁hakahau -7383 +▁halifax -7384 +▁hammura -7385 +▁hangaia -7386 +▁heimana -7387 +▁hilkias -7388 +▁hinarao -7389 +▁history -7390 +▁honiara -7391 +▁huriama -7392 +▁hussein -7393 +▁ihipapa -7394 +▁inseete -7395 +▁irenita -7396 +▁isabeau -7397 +▁jacquie -7398 +▁janaína -7399 +'. -7400 +it -7401 +jhi -7402 +vao -7403 +▁yi -7404 +buka -7405 +lowo -7406 +mila -7407 +ober -7408 +onet -7409 +▁hor -7410 +▁ior -7411 +▁rae -7412 +▁une -7413 +▁uri -7414 +▁vaù -7415 +bourg -7416 +chsen -7417 +mento -7418 +rates -7419 +troit -7420 +vanaa -7421 +álesz -7422 +едник -7423 +▁___? 
-7424 +▁akaa -7425 +▁anne -7426 +▁aunu -7427 +▁caso -7428 +▁efaa -7429 +▁jada -7430 +▁leys -7431 +▁maho -7432 +▁mori -7433 +▁peut -7434 +▁rafa -7435 +▁stre -7436 +rcumsp -7437 +rianum -7438 +wolowo -7439 +▁bojhi -7440 +▁faura -7441 +▁jacky -7442 +▁jamra -7443 +▁marty -7444 +▁meire -7445 +▁pimen -7446 +▁stats -7447 +▁strem -7448 +▁taura -7449 +komento -7450 +oncelos -7451 +▁angela -7452 +▁camila -7453 +▁coober -7454 +▁fauraò -7455 +▁fāpura -7456 +▁graffe -7457 +▁izdava -7458 +▁karzai -7459 +▁mahome -7460 +▁mieres -7461 +▁nuinga -7462 +▁pomare -7463 +▁rafael -7464 +▁sacalm -7465 +▁главни -7466 +vinyonet -7467 +▁aivanaa -7468 +▁aunuunu -7469 +▁awolowo -7470 +▁calonge -7471 +▁detroit -7472 +▁garrigo -7473 +▁haapoto -7474 +▁izdavač -7475 +▁janeiro -7476 +▁janvier -7477 +▁jaussen -7478 +▁jeanine -7479 +▁jinping -7480 +▁joachim -7481 +▁jussara -7482 +▁justine -7483 +▁kainuku -7484 +▁kaitito -7485 +▁karanga -7486 +▁kaupapa -7487 +▁kawongo -7488 +▁kilomin -7489 +▁klopper -7490 +▁knights -7491 +▁kuleana -7492 +▁kumanin -7493 +▁kôleeji -7494 +▁kōpūreo -7495 +▁larissa -7496 +▁lecythi -7497 +▁lexique -7498 +▁lietuva -7499 +.), -7500 +dam -7501 +fit -7502 +gol -7503 +mel -7504 +new -7505 +pys -7506 +uen -7507 +éon -7508 +▁ji -7509 +▁èà -7510 +duze -7511 +ffit -7512 +fifi -7513 +lleu -7514 +nunu -7515 +onto -7516 +équi -7517 +▁(), -7518 +▁bac -7519 +▁don -7520 +▁jor -7521 +▁muz -7522 +▁roc -7523 +▁sua -7524 +duzeć -7525 +mbusz -7526 +minum -7527 +munes -7528 +ngrua -7529 +tella -7530 +urval -7531 +▁esti -7532 +▁léon -7533 +▁mane -7534 +▁radc -7535 +▁rohe -7536 +duzeće -7537 +sminum -7538 +terera -7539 +équipe -7540 +▁afriy -7541 +▁atomi -7542 +▁dates -7543 +▁estre -7544 +▁gogol -7545 +▁homel -7546 +▁jordi -7547 +▁kopys -7548 +▁lycée -7549 +▁matua -7550 +▁muzeu -7551 +▁rouen -7552 +▁suave -7553 +▁tipen -7554 +istella -7555 +ngruang -7556 +phoenix -7557 +▁ahurei -7558 +▁cadaqu -7559 +▁durval -7560 +▁gentle -7561 +▁itiraa -7562 +▁limite -7563 +▁maneco -7564 +▁muzeum -7565 +▁māhora 
-7566 +▁navata -7567 +▁pānunu -7568 +▁rocles -7569 +▁ronald -7570 +▁sassou -7571 +▁sellal -7572 +▁suffit -7573 +▁tapone -7574 +▁ussher -7575 +▁vaiiho -7576 +jasminum -7577 +uixalleu -7578 +▁afriyie -7579 +▁cadaqué -7580 +▁jimángo -7581 +▁limited -7582 +▁llofriu -7583 +▁llogaia -7584 +▁llorenç -7585 +▁loisirs -7586 +▁londres -7587 +▁lottori -7588 +▁lourdes -7589 +▁lumiere -7590 +▁maestro -7591 +▁mandela -7592 +▁manihot -7593 +▁mapmuči -7594 +▁maraamu -7595 +▁maragai -7596 +▁marcelo -7597 +▁marinho -7598 +▁masarac -7599 +cad -7600 +fru -7601 +noi -7602 +ofe -7603 +▁ll -7604 +▁òu -7605 +calo -7606 +frug -7607 +muel -7608 +ncon -7609 +noha -7610 +tene -7611 +tāpa -7612 +zaré -7613 +▁ado -7614 +▁blo -7615 +▁llb -7616 +▁lle -7617 +▁são -7618 +▁tak -7619 +▁yaw -7620 +cados -7621 +gilev -7622 +ōporo -7623 +▁alvi -7624 +▁dala -7625 +▁deca -7626 +▁fano -7627 +▁itea -7628 +▁limi -7629 +▁smet -7630 +▁viri -7631 +samuel -7632 +▁adoni -7633 +▁blota -7634 +▁burgo -7635 +▁hanoi -7636 +▁llers -7637 +▁météo -7638 +▁nunes -7639 +▁rangi -7640 +▁sites -7641 +▁òutou -7642 +byteria -7643 +frugell -7644 +ncontre -7645 +▁alvise -7646 +▁cleyde -7647 +▁faatau -7648 +▁nazaré -7649 +▁papaya -7650 +▁sarrià -7651 +▁states -7652 +▁viride -7653 +▁whakau -7654 +byterian -7655 +ihianoha -7656 +▁hakihea -7657 +▁huitene -7658 +▁iteahia -7659 +▁limites -7660 +▁matangi -7661 +▁matehau -7662 +▁maupiha -7663 +▁maurice -7664 +▁mcgrath -7665 +▁meharry -7666 +▁mendoza -7667 +▁menezes -7668 +▁mennais -7669 +▁metturo -7670 +▁michael -7671 +▁mihiroa -7672 +▁miliona -7673 +▁minarii -7674 +▁mkpeyol -7675 +▁mogilev -7676 +▁moldova -7677 +▁monells -7678 +▁monstri -7679 +▁montcal -7680 +▁montgrí -7681 +▁morinda -7682 +▁moutame -7683 +▁musique -7684 +▁māremia -7685 +▁nationa -7686 +▁nevinha -7687 +▁nicolas -7688 +▁nirvana -7689 +▁nishani -7690 +▁nolasco -7691 +▁nucleic -7692 +▁obafemi -7693 +▁octobre -7694 +▁olivier -7695 +▁orriols -7696 +▁otumfuo -7697 +▁palikir -7698 +▁paltoga -7699 +sb -7700 +dar -7701 +ist -7702 
+lda -7703 +nds -7704 +pee -7705 +ppe -7706 +òne -7707 +appe -7708 +arts -7709 +atae -7710 +core -7711 +iter -7712 +koba -7713 +mayd -7714 +orga -7715 +sboa -7716 +sola -7717 +urit -7718 +wata -7719 +èche -7720 +▁fēì -7721 +▁let -7722 +▁mit -7723 +▁oix -7724 +▁pho -7725 +amahu -7726 +haere -7727 +rends -7728 +uriri -7729 +èches -7730 +▁alar -7731 +▁apee -7732 +▁deis -7733 +▁dite -7734 +▁hope -7735 +▁hula -7736 +▁hutu -7737 +▁kape -7738 +▁oroa -7739 +▁puis -7740 +▁roca -7741 +▁rāau -7742 +▁seba -7743 +église -7744 +▁araba -7745 +▁haumi -7746 +▁hilda -7747 +▁patoi -7748 +▁pukae -7749 +▁queen -7750 +▁scran -7751 +▁taeae -7752 +▁taofe -7753 +▁teata -7754 +▁twist -7755 +▁vanua -7756 +▁vorga -7757 +amahuta -7758 +appelle -7759 +mprends -7760 +rdèches -7761 +solanum -7762 +▁capsec -7763 +▁ditema -7764 +▁encore -7765 +▁freire -7766 +▁iakoba -7767 +▁lisboa -7768 +▁mahama -7769 +▁mitche -7770 +▁pātete -7771 +▁sourit -7772 +▁thomas -7773 +▁wawata -7774 +▁âpīraa -7775 +▁dindiok -7776 +▁haamene -7777 +▁lettres -7778 +▁panedes -7779 +▁parlavà -7780 +▁parlors -7781 +▁pasqual -7782 +▁patuhia -7783 +▁pecados -7784 +▁peduase -7785 +▁peptide -7786 +▁phoenix -7787 +▁pimenta -7788 +▁pinkett -7789 +▁polatsk -7790 +▁polessa -7791 +▁pologra -7792 +▁polymer -7793 +▁polymor -7794 +▁portbou -7795 +▁poutine -7796 +▁premier -7797 +▁private -7798 +▁prozeny -7799 +bac -7800 +ely -7801 +faè -7802 +hee -7803 +ifa -7804 +lló -7805 +».( -7806 +āfa -7807 +babi -7808 +chps -7809 +ctey -7810 +mbac -7811 +puru -7812 +▁cas -7813 +▁caz -7814 +▁cel -7815 +▁ent -7816 +▁frs -7817 +▁las -7818 +▁pel -7819 +▁vaa -7820 +▁èpe -7821 +babić -7822 +ckely -7823 +graph -7824 +oteur -7825 +tenim -7826 +çaise -7827 +▁adwo -7828 +▁cazu -7829 +▁deux -7830 +▁four -7831 +▁inga -7832 +▁kapa -7833 +▁kari -7834 +▁kate -7835 +▁kava -7836 +▁komo -7837 +▁line -7838 +▁matā -7839 +▁mini -7840 +▁moça -7841 +▁sils -7842 +▁tadi -7843 +▁varo -7844 +▁what -7845 +caceae -7846 +lusion -7847 +▁armen -7848 +▁braga -7849 +▁casse -7850 
+▁celso -7851 +▁entri -7852 +▁karin -7853 +▁matāu -7854 +▁mouse -7855 +▁nauru -7856 +▁orama -7857 +▁paula -7858 +▁prova -7859 +▁pāhee -7860 +▁tadić -7861 +▁tongu -7862 +▁váliá -7863 +clusion -7864 +itenati -7865 +perehia -7866 +▁ -7867 +a -7868 +i -7869 +t -7870 +e -7871 +r -7872 +o -7873 +n -7874 +u -7875 +m -7876 +h -7877 +’ -7878 +p -7879 +f -7880 +s -7881 +. -7882 +ō -7883 +ā -7884 +l -7885 +, -7886 +c -7887 +v -7888 +d -7889 +k -7890 +g -7891 +' -7892 +ē -7893 +ò -7894 +b -7895 +ū -7896 +y -7897 +ī -7898 +( -7899 +- -7900 +) -7901 +1 -7902 +w -7903 +2 -7904 +à -7905 +ì -7906 +ê -7907 +‘ -7908 +j -7909 +z -7910 +: -7911 +0 -7912 +á -7913 +â -7914 +é -7915 +4 -7916 +è -7917 +3 -7918 +5 -7919 +6 -7920 +" -7921 +7 -7922 +9 -7923 +8 -7924 +q -7925 +x -7926 +ʻ -7927 +ç -7928 +ô -7929 +; -7930 +û -7931 +í -7932 +и -7933 +| -7934 +ï -7935 +р -7936 +_ -7937 +ó -7938 +/ -7939 +î -7940 +ù -7941 +ǔ -7942 +• -7943 +е -7944 +? -7945 +« -7946 +а -7947 +» -7948 +с -7949 +б -7950 +к -7951 +ã -7952 +н -7953 +* -7954 +у -7955 +[ -7956 +° -7957 +ŭ -7958 +д -7959 += -7960 +ј -7961 ++ -7962 +] -7963 +о -7964 +п -7965 +ú -7966 +г -7967 +л -7968 +т -7969 +% -7970 +ˈ -7971 +в -7972 +ل -7973 +– -7974 +× -7975 +ć -7976 +č -7977 +з -7978 +ч -7979 +— -7980 +< -7981 +> -7982 +ä -7983 +ł -7984 +ш -7985 +ا -7986 +# -7987 +š -7988 +ʼ -7989 +й -7990 +ц -7991 +ы -7992 +я -7993 +ب -7994 +ع -7995 diff --git a/models/vocabulary/ty_vocabulary.parquet b/models/vocabulary/ty_vocabulary.parquet new file mode 100644 index 0000000000000000000000000000000000000000..328ae868e180f566c9f697dfc79fe951245f2836 --- /dev/null +++ b/models/vocabulary/ty_vocabulary.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d7ad18695375b4bd6ff6f1caf91a26969de2756605921e9e80c8781a34419f6 +size 43931 diff --git a/models/vocabulary/ty_vocabulary_metadata.json b/models/vocabulary/ty_vocabulary_metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..a02ae21a2f6c6a240829838e66cbd7d50094184c --- /dev/null +++ b/models/vocabulary/ty_vocabulary_metadata.json @@ -0,0 +1,16 @@ +{ + "language": "ty", + "vocabulary_size": 2668, + "variant": "full", + "statistics": { + "type_token_ratio": 0.10297356828193832, + "coverage": { + "top_100": 0.6740981069174902, + "top_1000": 0.875431598999881, + "top_5000": 0.971440052387189 + }, + "hapax_count": 4251, + "hapax_ratio": 0.6143951438069085, + "total_documents": 1258 + } +} \ No newline at end of file diff --git a/models/word_markov/ty_markov_ctx1_word.parquet b/models/word_markov/ty_markov_ctx1_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..56618284effbeecc137f3041f7779ca33bcbb76a --- /dev/null +++ b/models/word_markov/ty_markov_ctx1_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:042159a23ed02fdce621479a2f066bd5ed16cbbb1bee27afd0494e97897a9e18 +size 198322 diff --git a/models/word_markov/ty_markov_ctx1_word_metadata.json b/models/word_markov/ty_markov_ctx1_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..a8708ae0326d6b14c286ec5812c070f4d43268de --- /dev/null +++ b/models/word_markov/ty_markov_ctx1_word_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 1, + "variant": "word", + "language": "ty", + "unique_contexts": 6845, + "total_transitions": 65934 +} \ No newline at end of file diff --git a/models/word_markov/ty_markov_ctx2_word.parquet b/models/word_markov/ty_markov_ctx2_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..6001c5c614bd28f59b4341f2cb8ba5f886af328e --- /dev/null +++ b/models/word_markov/ty_markov_ctx2_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f14056c40caec0df6121f159fc989ab54f18af4d7f90144996f3fa1dcaaec02f +size 385803 diff --git a/models/word_markov/ty_markov_ctx2_word_metadata.json 
b/models/word_markov/ty_markov_ctx2_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ad45449aae24993be108802883f3db2fe6733c1c --- /dev/null +++ b/models/word_markov/ty_markov_ctx2_word_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 2, + "variant": "word", + "language": "ty", + "unique_contexts": 21075, + "total_transitions": 64676 +} \ No newline at end of file diff --git a/models/word_markov/ty_markov_ctx3_word.parquet b/models/word_markov/ty_markov_ctx3_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..950747f51a540458bffa1b282ba9b74e0704a21f --- /dev/null +++ b/models/word_markov/ty_markov_ctx3_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:010e49e0f5e05b0a7272124b938fd20a155ea9daf7446cd1f6bbcef9218c06a5 +size 575332 diff --git a/models/word_markov/ty_markov_ctx3_word_metadata.json b/models/word_markov/ty_markov_ctx3_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..96aca9df229e395ed16c660b36c09f8c300826e6 --- /dev/null +++ b/models/word_markov/ty_markov_ctx3_word_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 3, + "variant": "word", + "language": "ty", + "unique_contexts": 33605, + "total_transitions": 63418 +} \ No newline at end of file diff --git a/models/word_markov/ty_markov_ctx4_word.parquet b/models/word_markov/ty_markov_ctx4_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..5f27599777c0f06ac64e17b84bdcea0fb4f8202f --- /dev/null +++ b/models/word_markov/ty_markov_ctx4_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ba05218fa96e06502b509bbec2cf36fd21b073c463d997cebedfcce597879e7 +size 686772 diff --git a/models/word_markov/ty_markov_ctx4_word_metadata.json b/models/word_markov/ty_markov_ctx4_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..946a397d9529ede03092e423d3ccf76d701aee1c --- /dev/null 
+++ b/models/word_markov/ty_markov_ctx4_word_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 4, + "variant": "word", + "language": "ty", + "unique_contexts": 41713, + "total_transitions": 62160 +} \ No newline at end of file diff --git a/models/word_ngram/ty_2gram_word.parquet b/models/word_ngram/ty_2gram_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..abf03c754bdec2c2a81ca9a2613c6fcb662a5c92 --- /dev/null +++ b/models/word_ngram/ty_2gram_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10a78f718d5323cce64d8524b77687eaa54609dff2559a775dd56172d1955926 +size 20018 diff --git a/models/word_ngram/ty_2gram_word_metadata.json b/models/word_ngram/ty_2gram_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..bad0f792a35d174b99991ff1cdb9abb2cd63cb9d --- /dev/null +++ b/models/word_ngram/ty_2gram_word_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 2, + "variant": "word", + "language": "ty", + "unique_ngrams": 1465, + "total_ngrams": 65934 +} \ No newline at end of file diff --git a/models/word_ngram/ty_3gram_word.parquet b/models/word_ngram/ty_3gram_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..dbdbf13eb1c545c8f34d0009f125ea3bd27706bd --- /dev/null +++ b/models/word_ngram/ty_3gram_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0c1587ab533095256c88270b781578cda738e60ab10aedecb9c056766687a02 +size 36289 diff --git a/models/word_ngram/ty_3gram_word_metadata.json b/models/word_ngram/ty_3gram_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..feeda434e2c0a588f9e742cae95f658754befe52 --- /dev/null +++ b/models/word_ngram/ty_3gram_word_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 3, + "variant": "word", + "language": "ty", + "unique_ngrams": 2559, + "total_ngrams": 64676 +} \ No newline at end of file diff --git a/models/word_ngram/ty_4gram_word.parquet 
b/models/word_ngram/ty_4gram_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..8ebace37567875d417f38460a82b3564cb4efa56 --- /dev/null +++ b/models/word_ngram/ty_4gram_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc50d5ad3fa8222d6556b241e62500e2f8b5928b912757fed8c0123fe3c8340c +size 64883 diff --git a/models/word_ngram/ty_4gram_word_metadata.json b/models/word_ngram/ty_4gram_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..d0d48637f06c202fab25535dd0a3bfd332797c7e --- /dev/null +++ b/models/word_ngram/ty_4gram_word_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 4, + "variant": "word", + "language": "ty", + "unique_ngrams": 4355, + "total_ngrams": 63418 +} \ No newline at end of file diff --git a/models/word_ngram/ty_5gram_word.parquet b/models/word_ngram/ty_5gram_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..56551cb6641591ef4ccb5065b7117f29aee73169 --- /dev/null +++ b/models/word_ngram/ty_5gram_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba9da1787575d0b6015435d92b9a1ea06e9e4ba2110420f91ccd86de1ae487c7 +size 51641 diff --git a/models/word_ngram/ty_5gram_word_metadata.json b/models/word_ngram/ty_5gram_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..5ae7fe34b9cd35ea42a7cced8f2fc113df4f7ecb --- /dev/null +++ b/models/word_ngram/ty_5gram_word_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 5, + "variant": "word", + "language": "ty", + "unique_ngrams": 3200, + "total_ngrams": 62160 +} \ No newline at end of file diff --git a/ty_morph_tokenizer.json b/ty_morph_tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..688d6a59fbb77651107a22fb553572c37ee1d47a --- /dev/null +++ b/ty_morph_tokenizer.json @@ -0,0 +1,15631 @@ +{ + "language": "ty", + "prefixes": { + "t": 1204.3, + "a": 855.5, + "m": 714.9, + "p": 595.1, + "ta": 588.2, + "ma": 
553.8, + "fa": 342.5, + "pa": 265.5, + "te": 254.3, + "ra": 203.7, + "tu": 176.3, + "ha": 145.4, + "ti": 130.6, + "mo": 126.6, + "sa": 125.1, + "ar": 113.3, + "an": 106.6, + "me": 105.4, + "po": 91.5, + "to": 87.7, + "pe": 85.3, + "ro": 80.1, + "ka": 76.7 + }, + "suffixes": { + "a": 3056.0, + "e": 872.4, + "ia": 789.1, + "i": 706.7, + "aa": 681.7, + "ra": 298.9, + "na": 228.7, + "ta": 222.3, + "ga": 208.0, + "re": 139.9, + "ro": 129.8, + "ti": 128.7, + "ne": 126.4, + "au": 125.1, + "ni": 116.4, + "hi": 107.2, + "la": 103.9, + "ae": 103.0, + "ea": 90.6, + "te": 81.4, + "er": 81.4, + "ru": 81.4, + "us": 72.5 + }, + "ngram_scores": { + "e": 14698, + "t": 13338, + "a": 13137, + "te": 10307, + "i": 9732, + "m": 6649, + "o": 6428, + "ra": 5910, + "ta": 5457, + "ma": 5364, + "u": 5289, + "n": 4946, + "au": 4158, + "aa": 3854, + "ar": 3847, + "re": 3838, + "ti": 3810, + "at": 3608, + "it": 3482, + "ia": 3378, + "r": 3058, + "h": 2979, + "f": 2950, + "p": 2916, + "ite": 2795, + "ua": 2779, + "ir": 2735, + "em": 2731, + "ot": 2695, + "hi": 2684, + "no": 2671, + "na": 2556, + "ema": 2393, + ".": 2368, + "tem": 2331, + "tu": 2284, + "ha": 2268, + "er": 2239, + ",": 2236, + "mau": 2183, + "ah": 2141, + "an": 2110, + "ote": 2085, + "or": 2068, + "ri": 2039, + "et": 2017, + "to": 1957, + "ni": 1950, + "ai": 1939, + "fa": 1874, + "iti": 1850, + "ata": 1800, + "pa": 1747, + "en": 1734, + "oi": 1656, + "’o": 1647, + "ne": 1566, + "ei": 1557, + "ahi": 1511, + "ro": 1492, + "raa": 1489, + "in": 1482, + "eh": 1416, + "’": 1407, + "ef": 1313, + "ur": 1305, + "ate": 1301, + "mo": 1275, + "am": 1268, + "’a": 1246, + "ara": 1241, + "ho": 1195, + "ire": 1194, + "not": 1191, + "a’": 1190, + "ō": 1123, + "nō": 1109, + "ere": 1105, + "teh": 1060, + "ap": 1041, + "oir": 1038, + "a.": 1036, + "oire": 1035, + "rei": 1024, + "’oi": 1011, + "tef": 1009, + "’oir": 1008, + "ira": 1002, + "a’a": 994, + "nu": 980, + "tin": 961, + "eit": 960, + "inō": 939, + "s": 932, + "tet": 892, + "a,": 871, + "mā": 
855, + "va": 854, + "oa": 842, + "ana": 830, + "po": 827, + "ao": 826, + "mat": 809, + "fe": 807, + "ep": 797, + "pi": 780, + "far": 777, + "tah": 760, + "mata": 759, + "ea": 754, + "ii": 745, + "faa": 735, + "af": 734, + "mot": 731, + "ru": 729, + "otu": 729, + "ae": 728, + "eta": 728, + "nua": 709, + "um": 706, + "motu": 706, + "on": 701, + "ete": 691, + "me": 688, + "k": 686, + "tahi": 679, + ",e": 672, + "aat": 670, + "pe": 669, + "ih": 668, + "ra’": 665, + "up": 663, + "ra’a": 663, + "enu": 661, + "enua": 658, + "pu": 653, + "he": 650, + "ora": 650, + "fen": 649, + "fenu": 649, + "ter": 645, + "afa": 642, + "io": 639, + "efa": 637, + "oh": 636, + "nia": 630, + ".m": 629, + "haa": 629, + "ān": 628, + "hit": 625, + "are": 618, + "iraa": 614, + "ato": 612, + "ura": 610, + "mai": 605, + "ka": 599, + "ng": 597, + "’at": 595, + "ē": 591, + "un": 590, + "ōt": 583, + "nōt": 581, + "tat": 580, + "ori": 577, + "eti": 577, + "aup": 572, + "ò": 569, + "v": 567, + "ama": 565, + "tar": 564, + "ut": 563, + "ano": 563, + "hiti": 563, + "so": 561, + "efe": 561, + "hō": 560, + "ahit": 552, + "mu": 548, + "era": 545, + "hia": 541, + "taa": 541, + "par": 534, + "a'": 533, + "es": 529, + "eo": 522, + "tata": 520, + "ehō": 517, + "’ē": 513, + "ita": 512, + "ō’": 511, + "hō’": 511, + "ō’ē": 511, + "hō’ē": 511, + "ia.": 507, + "ari": 507, + "tua": 504, + "net": 500, + "ē’": 499, + "’ē’": 499, + "ē’o": 499, + "la": 498, + "rū": 496, + "ou": 494, + "tep": 491, + "iai": 489, + "atar": 489, + "uno": 487, + ".ma": 484, + "ten": 481, + "im": 480, + "ūn": 478, + "ria": 478, + "tere": 476, + "hu": 475, + "atah": 471, + "ūni": 468, + "ūnia": 467, + "arū": 466, + "rūn": 466, + "tarū": 466, + "arūn": 466, + "rūni": 466, + "ōta": 465, + "ga": 464, + "rā": 464, + "rau": 462, + "a.m": 462, + "ie": 461, + "u’": 460, + "para": 460, + "au’": 457, + "u’o": 456, + "al": 455, + "tea": 454, + "tia": 453, + "d": 451, + "'a": 450, + "om": 449, + "mar": 449, + "ui": 441, + "eha": 439, + "i.": 438, + "b": 
431, + "el": 431, + "oia": 429, + "1": 428, + "tit": 426, + "per": 424, + "sor": 419, + "atu": 415, + "sori": 415, + "av": 412, + "aap": 406, + "li": 393, + ".t": 389, + "aur": 387, + "rah": 386, + "oto": 386, + "aum": 386, + "eno": 386, + "si": 379, + "rahi": 376, + "de": 375, + ",i": 375, + "api": 373, + "arau": 372, + "le": 371, + "oria": 371, + "haap": 371, + "l": 364, + "pii": 362, + "nga": 362, + "ōs": 361, + "nōs": 360, + "ōso": 360, + "uh": 358, + "aut": 358, + "(": 357, + "c": 356, + "ati": 356, + "ak": 355, + "ve": 349, + "ām": 349, + "fare": 349, + "2": 347, + "rit": 346, + "han": 345, + "rot": 343, + "ip": 341, + "apii": 341, + "uf": 340, + "i,": 339, + "āni": 339, + "aam": 339, + "aapi": 338, + ",t": 337, + "tā": 335, + "tam": 333, + "sa": 328, + "g": 327, + "hau": 327, + "aura": 327, + "ihi": 325, + "arā": 325, + "rān": 325, + ".te": 325, + "roto": 325, + "nau": 322, + "umā": 322, + "nt": 321, + "rāni": 321, + "iro": 320, + "arān": 320, + "is": 319, + "nei": 318, + "auf": 318, + "farā": 317, + "aha": 313, + "ene": 312, + "epa": 312, + "pere": 312, + ".u": 311, + "a,e": 310, + "amo": 309, + "eho": 309, + ".ua": 309, + "vi": 308, + "ine": 307, + "ā": 306, + "mi": 304, + "tei": 304, + "man": 303, + "eni": 302, + "iir": 302, + "auh": 301, + "op": 299, + "iira": 298, + "uam": 295, + "faat": 295, + "tor": 293, + "rat": 292, + "apa": 292, + "os": 291, + "āt": 288, + "ê": 287, + "tau": 287, + "ee": 286, + "piir": 285, + "pō": 283, + "a‘": 283, + "tun": 283, + "her": 281, + "iri": 280, + "rii": 280, + "amot": 280, + "ol": 278, + "ōr": 278, + "iho": 278, + "etia": 278, + "ret": 277, + "hor": 276, + ",te": 276, + "hin": 275, + "e,": 274, + "uar": 273, + "ait": 272, + "e.": 271, + "rī": 271, + "il": 270, + "iaf": 268, + "'i": 267, + "toi": 267, + "aata": 267, + "w": 264, + "pōr": 263, + "arii": 263, + "ko": 262, + "se": 260, + "ki": 260, + "ohe": 260, + "uta": 259, + "neti": 259, + "eret": 258, + "upa": 257, + "poh": 256, + "teo": 256, + "’ot": 256, + "uha": 254, 
+ "upo": 254, + "ca": 253, + "nai": 253, + "oê": 252, + "aro": 252, + "hoê": 252, + "īn": 251, + "tai": 251, + "nia.": 251, + "pohe": 251, + "taat": 251, + "īne": 250, + "tite": 250, + "iten": 249, + "ohi": 248, + "aai": 247, + "aamo": 247, + "uan": 246, + "ōrī": 245, + "ater": 245, + "ic": 244, + "īnet": 244, + "hana": 244, + "rīn": 243, + "rīne": 243, + "oo": 242, + "uma": 241, + "reti": 241, + "etit": 241, + "teni": 241, + "taam": 241, + "pū": 240, + "ev": 239, + "fā": 239, + "’i": 239, + "as": 238, + "pōrī": 238, + "ōrīn": 238, + "tama": 237, + "mari": 237, + "‘a": 235, + "oro": 235, + "’ar": 234, + "ino": 234, + "toa": 233, + "mua": 233, + "da": 231, + "aan": 231, + "i'": 230, + "ani": 230, + "āna": 230, + ":": 228, + "ahin": 228, + "aate": 227, + "go": 226, + "eter": 226, + "lo": 225, + "rav": 225, + "eat": 225, + "hine": 224, + "o'": 223, + "uru": 222, + "a’ar": 222, + "ac": 220, + "oru": 220, + "tum": 220, + "ad": 218, + "bu": 218, + "atoa": 218, + "fān": 217, + "uah": 217, + "fāna": 217, + "naur": 217, + "oma": 215, + "ha’": 215, + "reh": 215, + "ha’a": 215, + "ānau": 215, + "amar": 215, + "oraa": 214, + "pae": 213, + "ihia": 213, + "roa": 211, + "hera": 210, + "tene": 210, + "ll": 209, + "st": 209, + "uat": 208, + "ang": 206, + "ute": 206, + "a'i": 204, + "ura’": 204, + "era’": 204, + "ara’": 203, + "’ara": 202, + "āmo": 201, + "oher": 201, + "vah": 200, + "amu": 200, + "ce": 199, + "mah": 199, + "ra,": 198, + "ufā": 198, + "uā": 197, + "enet": 197, + "iae": 197, + "nete": 196, + "toru": 195, + "araa": 194, + "āmot": 194, + "etu": 193, + "tuā": 191, + "uām": 191, + "tuām": 191, + "uāmo": 191, + "ik": 190, + "ni.": 190, + "ria.": 190, + "eu": 189, + "ipa": 189, + "rep": 189, + "vahi": 189, + "ba": 188, + "hip": 188, + "ue": 186, + "fi": 186, + "i’": 186, + "ito": 186, + "tuat": 186, + "hora": 185, + "māt": 184, + "ss": 183, + "hipa": 183, + "us": 182, + "ku": 182, + "'n": 182, + "tir": 182, + "nio": 182, + "tur": 182, + "uaf": 182, + "ke": 181, + "ren": 
181, + "ta’": 181, + "tou": 181, + "tih": 181, + "ch": 180, + ";": 179, + "rar": 179, + "'na": 179, + "uo": 178, + "eva": 178, + "ima": 178, + "tan": 177, + ".e": 177, + "ave": 175, + "ator": 175, + "'": 172, + "uraa": 172, + "gh": 171, + "irit": 171, + "tihi": 171, + "wh": 170, + "āni.": 170, + "rir": 169, + "j": 168, + "iu": 168, + "di": 168, + "nom": 168, + "à": 167, + "ab": 167, + "i'a": 167, + "ohip": 167, + "nat": 166, + "pir": 166, + "0": 165, + "rita": 165, + "ran": 164, + "uai": 164, + "tira": 164, + "â": 163, + "aia": 163, + "be": 162, + "‘e": 161, + "uato": 161, + "ina": 160, + "aar": 160, + "’n": 159, + "ìt": 159, + "rg": 158, + "u,": 158, + "rave": 157, + "piri": 157, + "ci": 156, + "rai": 156, + "fr": 155, + "nd": 155, + "wa": 155, + "tuh": 155, + ")": 154, + "aò": 154, + "iat": 154, + "a,i": 154, + "if": 153, + "mon": 153, + "ane": 153, + "’na": 153, + "run": 153, + "amā": 153, + "uri": 152, + "aer": 152, + "ipō": 152, + "ihor": 152, + ",n": 151, + "ìti": 151, + "co": 150, + "ini": 150, + "hae": 150, + "rev": 149, + "ereh": 149, + "por": 148, + "aita": 147, + "uk": 146, + "aho": 146, + "ota": 146, + "reva": 146, + "aere": 146, + "ìtih": 146, + "aka": 145, + "mait": 145, + "ore": 144, + "tae": 144, + "riro": 144, + "ehau": 144, + "ma'": 143, + "aua": 143, + "do": 142, + "aui": 142, + "eò": 142, + "haer": 142, + "y": 141, + "air": 141, + "wha": 141, + "oe": 140, + "òi": 140, + "pap": 140, + "aei": 140, + "reha": 140, + "ma'i": 140, + "-": 139, + "āì": 139, + "māì": 139, + "āìt": 139, + "uap": 139, + "tuha": 139, + "māìt": 139, + "āìti": 139, + "aru": 138, + "og": 137, + "ov": 137, + "òir": 137, + "òire": 137, + "una": 136, + "aao": 136, + ".i": 136, + "atir": 136, + "ūp": 135, + "tām": 135, + "aoi": 135, + "anga": 135, + "ava": 134, + "a‘e": 134, + "gha": 134, + "aii": 134, + "uhaa": 134, + "ghan": 134, + "i‘": 133, + "aah": 133, + "hur": 133, + "pūp": 133, + "'e": 132, + "iv": 132, + "aau": 132, + "epū": 132, + "ūpi": 132, + "repū": 132, + "epūp": 
132, + "pūpi": 132, + "ūpir": 132, + "th": 130, + "'o": 130, + "6": 130, + "uir": 129, + "fan": 129, + "nar": 129, + "noa": 129, + "ny": 128, + "eir": 128, + "emo": 127, + "ātā": 127, + "āmu": 127, + "tita": 127, + "tāmu": 127, + "eòi": 127, + "),": 126, + "ram": 126, + ",u": 126, + "ioi": 126, + "ph": 125, + "mea": 125, + "rap": 125, + "nam": 125, + "atou": 125, + "i,e": 125, + "mātā": 125, + "ātām": 125, + "āmua": 125, + "āi": 124, + "òn": 124, + "hui": 124, + "anu": 124, + "atua": 124, + "ed": 123, + "5": 123, + "òna": 123, + "upu": 123, + "a,t": 122, + "tr": 121, + "aor": 121, + "ifa": 121, + "tev": 121, + "rao": 121, + "māi": 121, + "maha": 121, + "uira": 121, + "eira": 121, + "eua": 121, + ",ua": 121, + "ahu": 120, + "met": 120, + "ona": 119, + "a’i": 119, + "ge": 118, + "id": 118, + "‘o": 118, + "imā": 118, + "aati": 118, + "3": 117, + "o,": 117, + "tao": 117, + "eto": 116, + "iao": 116, + "aot": 116, + "hak": 116, + "huru": 116, + "eie": 115, + ",o": 115, + "bur": 115, + "pā": 114, + "uhi": 114, + "reir": 113, + "ra.": 112, + "reo": 111, + "poo": 111, + "oao": 111, + "fana": 111, + "itit": 111, + "rama": 110, + "ta'": 109, + "tui": 109, + "eor": 109, + "iaa": 109, + "urg": 109, + "of": 108, + "ya": 108, + "4": 108, + "nap": 108, + "maa": 108, + "mara": 108, + "faah": 108, + "ata’": 108, + "ta’i": 108, + "’im": 108, + "burg": 108, + "ant": 107, + "rer": 107, + "huir": 107, + "teie": 107, + "iaò": 107, + "nin": 106, + "apu": 106, + "ika": 105, + "ume": 105, + "ti'": 105, + "aun": 105, + "itai": 105, + "7": 104, + "ïa": 104, + "utu": 104, + "erā": 104, + "anau": 104, + "ag": 103, + "ono": 103, + "to'": 103, + "gos": 103, + "tap": 103, + "ōte": 103, + "aram": 103, + "nog": 103, + "ti'a": 103, + "ns": 102, + "rik": 102, + "a(": 102, + "oor": 102, + "iua": 102, + "ul": 101, + "rt": 101, + "iò": 101, + "non": 101, + "rgo": 101, + "rapa": 101, + "ahan": 101, + "haka": 101, + "ï": 100, + "ār": 100, + "pun": 100, + "hoi": 100, + "eme": 100, + "ogh": 100, + "pua": 99, 
+ "tut": 99, + "ōb": 99, + "epe": 99, + "rato": 99, + "nōb": 99, + "urgo": 99, + "su": 98, + "ek": 98, + "ape": 98, + "ahia": 98, + "ōbu": 98, + "rgos": 98, + "bi": 97, + "oli": 97, + "opa": 97, + "a'n": 97, + "uhia": 97, + "tura": 97, + "whak": 97, + "9": 96, + "ti’": 96, + "metu": 96, + "a'na": 96, + "nte": 95, + "ion": 95, + "ufa": 95, + "ess": 95, + "uò": 95, + "ā’": 94, + "paa": 94, + "esi": 94, + "apo": 94, + "‘er": 94, + "hii": 94, + "oora": 94, + "ià": 93, + "lu": 93, + "e’": 93, + "ham": 93, + "aim": 93, + "i’a": 93, + "puna": 93, + "oai": 93, + "riti": 93, + "imu": 93, + "nop": 93, + "etua": 93, + "‘era": 93, + "fo": 92, + "ok": 92, + "res": 92, + "e,e": 92, + "aote": 92, + "tī": 91, + "tt": 91, + "ala": 91, + "sia": 91, + "ing": 91, + "pit": 91, + "pat": 91, + "i’i": 91, + "raat": 91, + "a‘er": 91, + "\"": 90, + "ēt": 90, + "ent": 90, + "mur": 90, + "tiu": 90, + "iha": 90, + "ace": 90, + "mani": 90, + "teò": 90, + "taot": 90, + "uka": 89, + "na,": 89, + "hir": 89, + "o'a": 89, + "uaa": 89, + "eraa": 89, + "poor": 89, + "bo": 88, + "a-": 88, + "rē": 88, + "u.": 88, + "ste": 88, + "avi": 88, + "êt": 88, + "nae": 88, + "raro": 88, + "8": 87, + "o‘": 87, + "ew": 87, + "tot": 87, + "’au": 87, + "hio": 87, + "aira": 87, + "ont": 86, + "āti": 86, + "a'e": 86, + "taua": 86, + "tuò": 86, + "rd": 85, + "san": 85, + "oni": 85, + "and": 85, + "eao": 85, + "ae.": 85, + "pr": 84, + "rom": 84, + "iih": 84, + ",m": 84, + "naa": 84, + "te’": 84, + "aaa": 84, + "aae": 84, + "i.m": 84, + "ā’a": 83, + "ēti": 83, + "o'n": 83, + "eoh": 83, + "muri": 83, + "fari": 83, + "i.u": 83, + "pori": 83, + "to'n": 83, + "o'na": 83, + "nc": 82, + "a)": 82, + "e1": 82, + "eae": 82, + "piti": 82, + "a’at": 82, + "rera": 82, + "tete": 82, + "atam": 82, + ".mo": 82, + "atur": 82, + "s.": 81, + "nah": 81, + "aih": 81, + "tii": 81, + "a.u": 81, + "oêt": 81, + "),n": 81, + "haam": 81, + "aama": 81, + "tamu": 81, + "qu": 80, + "jo": 80, + "fē": 80, + "pol": 80, + "etā": 80, + "oa,": 80, + "ear": 
80, + "ā’au": 80, + "mana": 80, + "auo": 80, + "’io": 80, + "eae.": 80, + "uare": 80, + "sc": 79, + "’e": 79, + "gi": 79, + "ta.": 79, + "nao": 79, + "rā’": 79, + "imi": 79, + "a.t": 79, + "rā’a": 79, + "horo": 79, + "efē": 79, + "‘i": 78, + "o.": 78, + "eri": 78, + "tes": 78, + "fēt": 78, + "cea": 78, + ",nō": 78, + "fēti": 78, + "ēti’": 78, + "ti’i": 78, + "acea": 78, + "ceae": 78, + "amua": 78, + "aì": 77, + "hi.": 77, + "a’n": 77, + "aa,": 77, + "’am": 77, + "iam": 77, + "faai": 77, + "gu": 76, + ".1": 76, + "râ": 76, + "ada": 76, + "vai": 76, + "ame": 76, + "oan": 76, + "epi": 76, + "ain": 76, + "ne,": 76, + "e2": 76, + "ooi": 76, + "rika": 76, + "ēn": 75, + "āp": 75, + "fri": 75, + "iar": 75, + "ako": 75, + "manu": 75, + "ong": 74, + "mor": 74, + "rem": 74, + "aem": 74, + "ta'n": 74, + "du": 73, + "ig": 73, + "oc": 73, + "top": 73, + "sso": 73, + "rara": 73, + "īt": 72, + "ā.": 72, + "e'": 72, + "les": 72, + "ici": 72, + "pup": 72, + "moa": 72, + "'ai": 72, + "aw": 71, + "a;": 71, + "na.": 71, + "uro": 71, + ".’": 71, + "eâ": 71, + "a'a": 71, + "arev": 71, + "mair": 71, + "eb": 70, + "omo": 70, + "pur": 70, + "mal": 70, + "ian": 70, + "hua": 70, + ".2": 70, + "auhi": 70, + "orit": 70, + "ja": 69, + "gr": 69, + "i-": 69, + "ton": 69, + "ale": 69, + "men": 69, + "tio": 69, + "mir": 69, + "1n": 69, + "aman": 69, + "mahi": 69, + "br": 68, + "one": 68, + "afr": 68, + "ure": 68, + "rea": 68, + "ela": 68, + "ei,": 68, + "iah": 68, + "mont": 68, + "aaho": 68, + "emā": 68, + "erer": 68, + "sz": 67, + "den": 67, + "i‘a": 67, + "eia": 67, + "pai": 67, + "epo": 67, + "ipe": 67, + "āra": 67, + "tup": 67, + "ni’": 67, + "hama": 67, + "ni’a": 67, + "òh": 66, + "ât": 66, + "ell": 66, + "tià": 66, + "rop": 66, + "ehu": 66, + "1no": 66, + "sh": 65, + "ô": 65, + "ye": 65, + "ec": 65, + "ero": 65, + "har": 65, + "epu": 65, + "iva": 65, + "òhi": 65, + "a.e": 65, + "tee": 65, + ".’o": 65, + "tema": 65, + "iio": 65, + "nei,": 65, + "eoi": 65, + "rr": 64, + "a:": 64, + "è": 64, + 
"eli": 64, + "fic": 64, + "i‘o": 64, + "ehe": 64, + "rua": 64, + "roo": 64, + "iap": 64, + "kit": 64, + ";e": 64, + "papa": 64, + "afri": 64, + "nā": 63, + "lin": 63, + "buk": 63, + ".f": 63, + "mou": 63, + "nor": 63, + "mā.": 63, + "oâ": 63, + "nati": 63, + "apaa": 63, + "i.t": 63, + "eii": 63, + "naf": 63, + "epā": 63, + "opō": 62, + "aare": 62, + "oana": 62, + "uv": 61, + "‘": 61, + "mer": 61, + "cie": 61, + "fau": 61, + "ehi": 61, + "eim": 61, + "noâ": 61, + "oaf": 61, + "onte": 61, + "rite": 61, + "moan": 61, + "mira": 61, + "ewh": 61, + "ob": 60, + "i(": 60, + "e'a": 60, + "aana": 60, + "te1": 60, + "omā": 60, + "tupu": 60, + "u,e": 60, + "paau": 60, + "aaur": 60, + "âp": 59, + "ia,": 59, + "uae": 59, + "iia": 59, + ",ma": 59, + "tara": 59, + "hira": 59, + "oât": 59, + "aòn": 59, + "e,t": 59, + "rn": 58, + "ts": 58, + ".h": 58, + "aea": 58, + "rur": 58, + "òt": 58, + "ua,": 58, + "elo": 58, + "uih": 58, + "a,u": 58, + "anah": 58, + "tepa": 58, + "esso": 58, + "ntes": 58, + "imir": 58, + "ā.t": 58, + "tew": 58, + "mē": 57, + "'ar": 57, + "eur": 57, + "lla": 57, + "tān": 57, + "āne": 57, + "tie": 57, + "nya": 57, + "oti": 57, + "osa": 57, + "fici": 57, + "a,o": 57, + "eap": 57, + "rs": 56, + ").": 56, + "ome": 56, + "ica": 56, + "van": 56, + "nan": 56, + "ric": 56, + "tion": 56, + "orom": 56, + "ita.": 56, + "arah": 56, + "cr": 55, + "-a": 55, + "aï": 55, + "lan": 55, + "re,": 55, + "nov": 55, + "mel": 55, + "‘ai": 55, + "aora": 55, + "aïa": 55, + "iit": 55, + "aria": 55, + "arav": 55, + "tess": 55, + "ssor": 55, + "00": 54, + "10": 54, + "aaf": 54, + "rae": 54, + "noh": 54, + "ti,": 54, + "àm": 54, + "teu": 54, + "a‘a": 54, + "oat": 54, + "ni'": 54, + "maar": 54, + "nof": 54, + "pupu": 54, + "u-": 53, + "mb": 53, + "nk": 53, + "20": 53, + "lle": 53, + "fra": 53, + "hou": 53, + "lit": 53, + "aen": 53, + "ove": 53, + "ova": 53, + "ner": 53, + "auv": 53, + "’os": 53, + "eâp": 53, + "ni'a": 53, + "nn": 52, + "āò": 52, + "ris": 52, + "pan": 52, + "itu": 52, + 
"ror": 52, + "âpo": 52, + "māò": 52, + "āòh": 52, + "aio": 52, + "uva": 52, + "vam": 52, + "esia": 52, + "ta’a": 52, + "e’o": 52, + "arit": 52, + "iòn": 52, + "māti": 52, + "âpoo": 52, + "māòh": 52, + "āòhi": 52, + "dr": 51, + "èn": 51, + "del": 51, + "a‘i": 51, + "oho": 51, + "tīt": 51, + "ber": 51, + "ier": 51, + "ena": 51, + "gat": 51, + "6n": 51, + "os.": 51, + "pār": 51, + "sant": 51, + "tāne": 51, + "a.i": 51, + "tera": 51, + "puar": 51, + "pape": 51, + "pato": 51, + "ārah": 51, + "gak": 51, + "maim": 51, + "aimi": 51, + "o’": 50, + "tē": 50, + "ill": 50, + "vin": 50, + "car": 50, + "kai": 50, + "2n": 50, + "aite": 50, + "raa,": 50, + "aufa": 50, + "ahir": 50, + "ly": 49, + "12": 49, + "que": 49, + "i'o": 49, + "oui": 49, + "unu": 49, + "nui": 49, + "eau": 49, + "5n": 49, + "ro'": 49, + "icie": 49, + "aait": 49, + "orar": 49, + "gos.": 49, + "s.m": 49, + "reâ": 49, + "'ara": 49, + "frik": 49, + "rl": 48, + "uu": 48, + "ub": 48, + "ila": 48, + "ime": 48, + "mit": 48, + "ron": 48, + "ide": 48, + "aa.": 48, + "nen": 48, + "ein": 48, + "a),": 48, + "ahur": 48, + "atio": 48, + "2no": 48, + "6no": 48, + "etep": 48, + "i,t": 48, + "5no": 48, + "àmā": 48, + ".mā": 48, + "pāra": 48, + "tane": 48, + "iàm": 48, + "aj": 47, + "11": 47, + "ili": 47, + "rin": 47, + "0n": 47, + "hiò": 47, + "nok": 47, + "mala": 47, + "eih": 47, + "fauf": 47, + "i,i": 47, + "nauh": 47, + "iti,": 47, + "eip": 47, + "atau": 47, + "eei": 47, + "oro'": 47, + "ro'a": 47, + "ū": 46, + "āh": 46, + "lia": 46, + "hi,": 46, + "òm": 46, + "ta,": 46, + "kar": 46, + "iet": 46, + "4n": 46, + "hov": 46, + "mui": 46, + "ken": 46, + "awh": 46, + "oaa": 46, + "faao": 46, + "ana,": 46, + ".ta": 46, + "aahi": 46, + "raau": 46, + "je": 45, + "vo": 45, + "od": 45, + "ay": 45, + "ū.": 45, + "aè": 45, + "za": 45, + "sk": 45, + "i;": 45, + "iur": 45, + "hen": 45, + "hap": 45, + "opu": 45, + "sta": 45, + "lar": 45, + "ake": 45, + "tek": 45, + "ali": 45, + "ofe": 45, + "3n": 45, + "hi'": 45, + "uhu": 45, + "ieh": 45, 
+ "here": 45, + "eif": 45, + "buka": 45, + "omē": 45, + "ahor": 45, + "ieho": 45, + "ehov": 45, + "hova": 45, + "mp": 44, + "cu": 44, + "ib": 44, + "vil": 44, + "sit": 44, + ")t": 44, + "tav": 44, + "pū.": 44, + "ola": 44, + "opo": 44, + "a1": 44, + "hoa": 44, + "oar": 44, + "7n": 44, + "afe": 44, + "fran": 44, + "ana.": 44, + "ira’": 44, + "aore": 44, + "niò": 44, + "4no": 44, + "topa": 44, + "hi'o": 44, + "raua": 44, + "poli": 44, + "olit": 44, + "7no": 44, + "eg": 43, + "ld": 43, + "uc": 43, + "ff": 43, + "êp": 43, + "cs": 43, + "nta": 43, + "our": 43, + "sie": 43, + "ngo": 43, + "iun": 43, + "vem": 43, + "êpe": 43, + "eio": 43, + "amah": 43, + ",no": 43, + "êta": 43, + "te2": 43, + "faaa": 43, + "nove": 43, + "3no": 43, + "urai": 43, + "i.f": 43, + "melo": 43, + "êper": 43, + "òhi.": 43, + "rang": 43, + "tō": 42, + "ze": 42, + "ct": 42, + "ry": 42, + "21": 42, + "sti": 42, + "for": 42, + "ēni": 42, + "sid": 42, + "ien": 42, + "ne.": 42, + "est": 42, + "uku": 42, + "ru,": 42, + "'or": 42, + "put": 42, + "oit": 42, + "fep": 42, + "toro": 42, + "faar": 42, + "pura": 42, + "amai": 42, + "oêp": 42, + "amui": 42, + "noê": 42, + "a.2": 42, + "we": 41, + "16": 41, + "15": 41, + "ast": 41, + "rēn": 41, + "ua.": 41, + "fei": 41, + "che": 41, + "gra": 41, + "abe": 41, + "ti.": 41, + "oei": 41, + ",k": 41, + "iura": 41, + "eres": 41, + "rēni": 41, + "fepu": 41, + "epua": 41, + "tapu": 41, + "nata": 41, + "liti": 41, + "i'ar": 41, + "a.1": 41, + "rc": 40, + "22": 40, + "’u": 40, + "e-": 40, + "ēr": 40, + "art": 40, + "isi": 40, + "mes": 40, + "var": 40, + "umu": 40, + "nit": 40, + "oca": 40, + ",h": 40, + "out": 40, + ".ò": 40, + "hop": 40, + "chi": 40, + "erē": 40, + "iii": 40, + "īte": 40, + "aon": 40, + "nee": 40, + "urē": 40, + "teb": 40, + "ufaa": 40, + "feia": 40, + "erâ": 40, + "uao": 40, + "ovem": 40, + "tiur": 40, + "tiun": 40, + "amau": 40, + "turu": 40, + "u,i": 40, + "ey": 39, + "m²": 39, + "14": 39, + "uà": 39, + "to’": 39, + ".n": 39, + "vau": 39, + "roi": 39, 
+ "au,": 39, + "uav": 39, + "ope": 39, + "tte": 39, + "9n": 39, + "the": 39, + "ēra": 39, + "tom": 39, + "ipo": 39, + "ve'": 39, + "euro": 39, + "tuo": 39, + "’oc": 39, + "arat": 39, + ")te": 39, + "'ei": 39, + "’ata": 39, + "iti.": 39, + "0no": 39, + "vema": 39, + "iunu": 39, + "perē": 39, + "tang": 39, + "aroa": 39, + "aatu": 39, + "tīte": 39, + "ve'a": 39, + "és": 38, + "-h": 38, + "z": 38, + "iz": 38, + "all": 38, + "ist": 38, + "pui": 38, + "can": 38, + "kur": 38, + "‘oa": 38, + "o‘a": 38, + "êf": 38, + "aie": 38, + "pea": 38, + "aki": 38, + "rut": 38, + "kat": 38, + "i2": 38, + "min": 38, + "ett": 38, + "rēr": 38, + "kor": 38, + "pah": 38, + "vih": 38, + "tumu": 38, + "i‘oa": 38, + "oêf": 38, + "9no": 38, + "e.t": 38, + "tana": 38, + "rora": 38, + "omet": 38, + "erēr": 38, + "rēra": 38, + "aiti": 38, + "paf": 38, + ".fa": 38, + "nuar": 38, + "otī": 38, + "ītem": 38, + "ravi": 38, + "avih": 38, + "vihi": 38, + "apoo": 38, + "cl": 37, + "18": 37, + "23": 37, + "ver": 37, + "rac": 37, + "ra‘": 37, + "eka": 37, + ",a": 37, + ")i": 37, + "dam": 37, + "lis": 37, + "nih": 37, + "nce": 37, + "hiv": 37, + "aue": 37, + "rus": 37, + "ean": 37, + "asi": 37, + "ra-": 37, + ":t": 37, + "eam": 37, + "faan": 37, + "naho": 37, + "side": 37, + "iden": 37, + "deni": 37, + "ehia": 37, + "ufe": 37, + "vini": 37, + "hane": 37, + "orao": 37, + "raor": 37, + "n,": 36, + "cc": 36, + "km": 36, + "zi": 36, + "wi": 36, + "-m": 36, + "gy": 36, + "àt": 36, + "ade": 36, + "eny": 36, + "oph": 36, + "ia’": 36, + "ard": 36, + "va,": 36, + "iki": 36, + "iau": 36, + "nea": 36, + ",f": 36, + "nie": 36, + "kaa": 36, + "ra;": 36, + "urop": 36, + "ropa": 36, + "a,n": 36, + "aaro": 36, + "lt": 35, + "-r": 35, + "sp": 35, + "mm": 35, + "az": 35, + "’t": 35, + "sm": 35, + "17": 35, + "ì": 35, + "āv": 35, + "iw": 35, + "s)": 35, + "ord": 35, + "err": 35, + "nes": 35, + "ofa": 35, + "uni": 35, + "e(": 35, + "-ma": 35, + "ovi": 35, + "aô": 35, + "la,": 35, + "ma,": 35, + "gam": 35, + "resi": 35, + 
"'ora": 35, + "nere": 35, + "aina": 35, + "êti": 35, + "yo": 34, + "ī": 34, + "oà": 34, + "rk": 34, + "òa": 34, + "uer": 34, + "hon": 34, + "neh": 34, + "’eu": 34, + "ior": 34, + "des": 34, + "ree": 34, + "'ah": 34, + "ede": 34, + "ern": 34, + "o(": 34, + "nii": 34, + ".k": 34, + "’eur": 34, + "arua": 34, + "ere,": 34, + "puta": 34, + "etah": 34, + "aner": 34, + "otē": 34, + "kura": 34, + "lv": 33, + "ow": 33, + "e:": 33, + "’ā": 33, + "ōê": 33, + "á": 33, + "bl": 33, + "km²": 33, + "tif": 33, + "ni‘": 33, + "eru": 33, + "pia": 33, + "ei.": 33, + "iel": 33, + "rte": 33, + "āta": 33, + "ffi": 33, + "tim": 33, + "uti": 33, + "pāp": 33, + "nti": 33, + "ise": 33, + "âto": 33, + "awa": 33, + "na'": 33, + "tāh": 33, + "hōê": 33, + "him": 33, + "tēn": 33, + "i’e": 33, + "tahu": 33, + "adam": 33, + "’op": 33, + "’ati": 33, + "ni‘a": 33, + "eai": 33, + ",ei": 33, + "rome": 33, + "apat": 33, + "atai": 33, + "gao": 33, + "o,i": 33, + "e‘": 32, + "fu": 32, + "-ra": 32, + "sd": 32, + "ra:": 32, + "upe": 32, + "het": 32, + "phi": 32, + "ach": 32, + "ais": 32, + "puk": 32, + "ouà": 32, + "aku": 32, + "off": 32, + "nal": 32, + "cia": 32, + "0t": 32, + "fir": 32, + "tta": 32, + "pih": 32, + "ami": 32, + "kan": 32, + "tas": 32, + "re.": 32, + "eke": 32, + "ēnu": 32, + "ai-": 32, + "’ov": 32, + "onga": 32, + "amat": 32, + "aime": 32, + "apar": 32, + "iem": 32, + "ahou": 32, + "esid": 32, + "êfa": 32, + "enei": 32, + "âtop": 32, + "uru,": 32, + "iaha": 32, + "mouà": 32, + "ohia": 32, + "uahi": 32, + "tēnu": 32, + "ēnua": 32, + "ré": 31, + "r,": 31, + "ck": 31, + "24": 31, + "ʻ": 31, + "bel": 31, + "cas": 31, + "tre": 31, + "td": 31, + "phe": 31, + "eah": 31, + "na‘": 31, + "ahe": 31, + "nis": 31, + "uto": 31, + "ifi": 31, + "te.": 31, + "âte": 31, + "au.": 31, + "ho'": 31, + "rui": 31, + "aak": 31, + "ia'": 31, + "nana": 31, + "uata": 31, + "’ol": 31, + "i.e": 31, + "eof": 31, + "taur": 31, + "ū.’": 31, + "site": 31, + "offi": 31, + "ffic": 31, + "vana": 31, + "airi": 31, + "uaò": 31, 
+ "taha": 31, + "tino": 31, + "pahi": 31, + "hope": 31, + "roa,": 31, + "uoh": 31, + "ju": 30, + "rf": 30, + "u‘": 30, + "29": 30, + "13": 30, + "ij": 30, + "tal": 30, + "gar": 30, + "anc": 30, + "ass": 30, + "aba": 30, + "ler": 30, + "nem": 30, + "ai.": 30, + "fer": 30, + "eng": 30, + "too": 30, + "tue": 30, + "kut": 30, + "tak": 30, + "āpa": 30, + "tāv": 30, + "cha": 30, + "usa": 30, + "imo": 30, + "i1": 30, + "rim": 30, + "noi": 30, + "o'i": 30, + "àte": 30, + "nei.": 30, + "hitu": 30, + "a’na": 30, + "oie": 30, + "nehe": 30, + "oae": 30, + ",ta": 30, + "noho": 30, + "âtet": 30, + "rava": 30, + "ine,": 30, + "o,e": 30, + "e.u": 30, + "afar": 30, + "damu": 30, + "ave'": 30, + "d'": 29, + "ça": 29, + "fl": 29, + "ud": 29, + "30": 29, + "25": 29, + "é": 29, + "gn": 29, + "hn": 29, + "ár": 29, + "kw": 29, + "êr": 29, + "upi": 29, + "ins": 29, + "ose": 29, + "e‘a": 29, + "o’n": 29, + "-hi": 29, + "taf": 29, + "cra": 29, + "atā": 29, + ",p": 29, + "acc": 29, + "rle": 29, + "tro": 29, + "ung": 29, + "pot": 29, + "kot": 29, + "sab": 29, + "att": 29, + "ann": 29, + "pa'": 29, + "a'o": 29, + "tuu": 29, + "āhō": 29, + "ōêr": 29, + "êra": 29, + "oha": 29, + "eman": 29, + "ira:": 29, + "mona": 29, + "tato": 29, + "tavi": 29, + "ania": 29, + "firi": 29, + "e,i": 29, + "uaè": 29, + "utur": 29, + "iahi": 29, + "aito": 29, + "puka": 29, + "utua": 29, + "tāhō": 29, + "āhōê": 29, + "hōêr": 29, + "ōêra": 29, + "êraa": 29, + "'an": 29, + "aapu": 29, + "nç": 28, + "?": 28, + "x": 28, + "(m": 28, + "i)": 28, + "s,": 28, + "u'": 28, + "(t": 28, + "tū": 28, + "yi": 28, + "ens": 28, + "nge": 28, + "ort": 28, + "mo‘": 28, + ".o": 28, + "mil": 28, + "don": 28, + "ony": 28, + "kau": 28, + "int": 28, + "1t": 28, + "isa": 28, + "abu": 28, + "fa'": 28, + "ihu": 28, + "oio": 28, + "taim": 28, + "’ob": 28, + "rata": 28, + "iei": 28, + "a,m": 28, + "ahap": 28, + "hapa": 28, + "ette": 28, + "piha": 28, + "ahi,": 28, + "apa'": 28, + "i'or": 28, + "‘ei": 28, + "inaa": 28, + "ruo": 28, + "rica": 28, 
+ "enya": 28, + "q": 27, + "l.": 27, + "²": 27, + "ūt": 27, + "oj": 27, + "sl": 27, + "lá": 27, + "ers": 27, + "nel": 27, + "adu": 27, + "enc": 27, + "nim": 27, + "erf": 27, + "êa": 27, + "son": 27, + "’tu": 27, + "pa.": 27, + "pet": 27, + "lam": 27, + "ènā": 27, + "nāt": 27, + "omi": 27, + "u(": 27, + "sse": 27, + "len": 27, + "nir": 27, + "hei": 27, + "nun": 27, + "une": 27, + "fa’": 27, + "aoh": 27, + "8n": 27, + "ebu": 27, + "'in": 27, + "'ir": 27, + "vila": 27, + "ment": 27, + "itia": 27, + "ief": 27, + "’om": 27, + "ahi.": 27, + "mesi": 27, + "teit": 27, + "eite": 27, + "itei": 27, + "raa.": 27, + "iete": 27, + "unaa": 27, + ":te": 27, + ",ia": 27, + "aèn": 27, + "atan": 27, + "utou": 27, + "iin": 27, + "òma": 27, + "eina": 27, + "maro": 27, + "ènāt": 27, + "nāta": 27, + "keny": 27, + "akaa": 27, + "a;e": 27, + "aoe": 27, + "aaap": 27, + "rm": 26, + "yn": 26, + "né": 26, + "()": 26, + "ā'": 26, + "pǔ": 26, + "pŭ": 26, + "ase": 26, + "anç": 26, + "sup": 26, + "rfi": 26, + "hun": 26, + "rad": 26, + "com": 26, + "pou": 26, + "nak": 26, + "bar": 26, + "ros": 26, + "sot": 26, + "mao": 26, + "'it": 26, + "oa.": 26, + "meh": 26, + "aip": 26, + "poi": 26, + "pue": 26, + "kwa": 26, + "unō": 26, + "uper": 26, + "moro": 26, + "aapa": 26, + "ana‘": 26, + "taea": 26, + "avin": 26, + "onal": 26, + "taie": 26, + "aiet": 26, + "tapa": 26, + "a'it": 26, + "ei‘": 26, + "uoi": 26, + "maur": 26, + "tiar": 26, + "outo": 26, + "naô": 26, + "aari": 26, + "aab": 26, + "rura": 26, + "ahi'": 26, + "tiah": 26, + "loo": 26, + "ls": 25, + "ug": 25, + "'u": 25, + "ez": 25, + "pû": 25, + "î": 25, + "(a": 25, + "e\"": 25, + "pî": 25, + "ʻo": 25, + "(c": 25, + "ky": 25, + "hy": 25, + "ole": 25, + "umo": 25, + ":1": 25, + "ind": 25, + "eph": 25, + "iak": 25, + "eut": 25, + "ési": 25, + "hil": 25, + "sto": 25, + "ndr": 25, + "ka,": 25, + "pen": 25, + "ssi": 25, + "e3": 25, + "tip": 25, + "joh": 25, + "ger": 25, + "oa'": 25, + "êo": 25, + "ccr": 25, + "ii,": 25, + "ahua": 25, + "teri": 25, + 
"arap": 25, + "ranç": 25, + ".hu": 25, + "supe": 25, + "perf": 25, + "erfi": 25, + "rfic": 25, + "romo": 25, + "ira,": 25, + "tini": 25, + "atta": 25, + "fa’a": 25, + "ine.": 25, + "nira": 25, + "taut": 25, + "noo": 25, + "naha": 25, + "hang": 25, + "ukut": 25, + "akar": 25, + "anaa": 25, + "8no": 25, + "atae": 25, + "accr": 25, + "'ira": 25, + "veo": 25, + "pa'i": 25, + "pl": 24, + "l-": 24, + "gl": 24, + "hr": 24, + "-o": 24, + "nh": 24, + "26": 24, + "n-": 24, + "ás": 24, + "zt": 24, + "ilo": 24, + "asa": 24, + "vat": 24, + "ium": 24, + "ie:": 24, + "cat": 24, + "pha": 24, + "kal": 24, + "a’t": 24, + "u‘a": 24, + "tāp": 24, + "va'": 24, + "ssa": 24, + "bas": 24, + "fat": 24, + "èna": 24, + "òr": 24, + "òp": 24, + "oua": 24, + "gne": 24, + "raf": 24, + "ai,": 24, + "iss": 24, + "roh": 24, + "'ao": 24, + "shi": 24, + "êm": 24, + "i-a": 24, + "asu": 24, + "yan": 24, + "szt": 24, + "koa": 24, + "iwh": 24, + "gaw": 24, + "opa.": 24, + "uran": 24, + "’oa": 24, + "ales": 24, + "cie:": 24, + "omon": 24, + "uho": 24, + "ille": 24, + "aohi": 24, + "apur": 24, + "nuna": 24, + "aara": 24, + "fa'a": 24, + ".fe": 24, + "te‘": 24, + "ture": 24, + "mām": 24, + "etan": 24, + "rima": 24, + "ruru": 24, + "kain": 24, + "ana'": 24, + "ccra": 24, + "19": 23, + "e)": 23, + "27": 23, + "kh": 23, + "bd": 23, + "sen": 23, + "tel": 23, + "ven": 23, + "rie": 23, + "ndi": 23, + "lio": 23, + "war": 23, + "uts": 23, + "ni,": 23, + "nda": 23, + "ert": 23, + "hel": 23, + "uis": 23, + "igh": 23, + "sal": 23, + "kap": 23, + "ele": 23, + "ign": 23, + "s),": 23, + "eon": 23, + "ohn": 23, + "bet": 23, + "fet": 23, + "toà": 23, + "5t": 23, + "a2": 23, + "apî": 23, + "oa‘": 23, + "-at": 23, + "nos": 23, + "-hia": 23, + "tde": 23, + "lari": 23, + "itih": 23, + "pani": 23, + "repu": 23, + "teta": 23, + "nett": 23, + "tori": 23, + "race": 23, + "òta": 23, + "orea": 23, + "paru": 23, + "aa‘": 23, + "ahaa": 23, + "aad": 23, + "john": 23, + "t-": 22, + "iq": 22, + "lm": 22, + "nm": 22, + "(,": 22, + "o-": 
22, + "t,": 22, + "•": 22, + "hā": 22, + "ā‘": 22, + "e|": 22, + "ons": 22, + "lon": 22, + "col": 22, + "cor": 22, + "au-": 22, + "arl": 22, + "sel": 22, + "pri": 22, + "aga": 22, + "sca": 22, + "uel": 22, + "nav": 22, + "bra": 22, + ".p": 22, + "sep": 22, + "emi": 22, + "ivi": 22, + ")n": 22, + ",)": 22, + "uit": 22, + "ida": 22, + "ga,": 22, + "kah": 22, + "ngi": 22, + "kam": 22, + ".a": 22, + "vig": 22, + "ma’": 22, + "ref": 22, + "abd": 22, + "paì": 22, + "hai": 22, + "2t": 22, + "dia": 22, + "ngu": 22, + "eth": 22, + "ife": 22, + "o’a": 22, + "'at": 22, + "afi": 22, + "dan": 22, + "tec": 22, + "pao": 22, + "vae": 22, + "a‘o": 22, + "'i,": 22, + "ie.": 22, + "kuf": 22, + "hiva": 22, + "oam": 22, + "a.’": 22, + "ciel": 22, + "otea": 22, + "ite.": 22, + "nua.": 22, + "aal": 22, + "eria": 22, + "oror": 22, + "nua,": 22, + "ènat": 22, + "tuaf": 22, + "uafa": 22, + "huaa": 22, + "iara": 22, + "paar": 22, + "ia'n": 22, + "'t": 21, + "n.": 21, + "-t": 21, + "hī": 21, + "ká": 21, + "ōp": 21, + "m)": 21, + "rp": 21, + "pal": 21, + "lau": 21, + "gen": 21, + "lva": 21, + "str": 21, + "mas": 21, + "sem": 21, + "mis": 21, + "ho‘": 21, + "ben": 21, + "fa‘": 21, + "iqu": 21, + "con": 21, + "ooa": 21, + "oka": 21, + "oly": 21, + "eve": 21, + "sil": 21, + "din": 21, + "ipi": 21, + "ea,": 21, + "te,": 21, + "0m": 21, + "hot": 21, + "e4": 21, + "āte": 21, + "ndo": 21, + "edo": 21, + "bal": 21, + "ohu": 21, + "gas": 21, + "oum": 21, + "tri": 21, + "rana": 21, + "tooa": 21, + "anih": 21, + "eav": 21, + "oêa": 21, + "hito": 21, + "hene": 21, + "maru": 21, + "otop": 21, + "init": 21, + "iona": 21, + "vign": 21, + "igne": 21, + "gnet": 21, + "ma’a": 21, + "a’am": 21, + "mati": 21, + "pāpa": 21, + "20n": 21, + "teâ": 21, + "poto": 21, + "avae": 21, + "autu": 21, + "arar": 21, + "oêm": 21, + "oroa": 21, + "oêo": 21, + "moni": 21, + "opea": 21, + "maf": 21, + "inga": 21, + "nima": 21, + "ango": 21, + "yang": 21, + "alar": 21, + "puaa": 21, + "urur": 21, + "'iti": 21, + "tc": 20, + "rb": 
20, + "û": 20, + "â,": 20, + "ōn": 20, + "‘u": 20, + "..": 20, + "-p": 20, + "np": 20, + "l,": 20, + "rê": 20, + "'ā": 20, + "yt": 20, + "rra": 20, + "rge": 20, + "ies": 20, + "gue": 20, + "hie": 20, + "lek": 20, + "ado": 20, + "ajo": 20, + "cam": 20, + "nça": 20, + "ous": 20, + "òf": 20, + "ro,": 20, + "hao": 20, + "mus": 20, + "ich": 20, + "a’u": 20, + "ice": 20, + "āva": 20, + "los": 20, + "eca": 20, + "mad": 20, + "noc": 20, + "edi": 20, + "nic": 20, + "eco": 20, + "oko": 20, + "ra'": 20, + "a't": 20, + "'tu": 20, + "vii": 20, + "set": 20, + "ia‘": 20, + "eer": 20, + "áre": 20, + "eot": 20, + "erau": 20, + "ique": 20, + "erem": 20, + "rema": 20, + "nihi": 20, + "sde": 20, + "poly": 20, + "efr": 20, + "osep": 20, + "ra‘i": 20, + "auro": 20, + "phet": 20, + "heta": 20, + "ta’n": 20, + "elia": 20, + "ekal": 20, + "kale": 20, + "lesi": 20, + "tuar": 20, + ".no": 20, + "varu": 20, + "enō": 20, + "āpaì": 20, + "ataa": 20, + "a.ò": 20, + "atoà": 20, + "hina": 20, + "a'tu": 20, + "feti": 20, + "tua,": 20, + ".ko": 20, + "anim": 20, + "abet": 20, + "uamo": 20, + "ua‘": 20, + "ix": 19, + "ér": 19, + "«": 19, + "zo": 19, + ".\"": 19, + "i:": 19, + "ji": 19, + "cal": 19, + "las": 19, + "llo": 19, + "esc": 19, + "sar": 19, + "dis": 19, + "to‘": 19, + "o‘i": 19, + "‘or": 19, + "hoh": 19, + "ītī": 19, + "uem": 19, + "rne": 19, + "çai": 19, + "nde": 19, + "lyn": 19, + "lou": 19, + "ao,": 19, + "tik": 19, + "ūti": 19, + "i7": 19, + "org": 19, + "ash": 19, + "ial": 19, + "aph": 19, + "ues": 19, + "rum": 19, + "iac": 19, + "kin": 19, + "uia": 19, + "aet": 19, + "iiv": 19, + "sha": 19, + "oer": 19, + "tsa": 19, + "gah": 19, + "ïa,": 19, + "ia(": 19, + "nter": 19, + "enta": 19, + "amer": 19, + "ança": 19, + "çais": 19, + "cast": 19, + "andr": 19, + "seph": 19, + "ioni": 19, + "pam": 19, + "iihi": 19, + "ïai": 19, + "e,o": 19, + "iare": 19, + "(,)": 19, + "roma": 19, + "bela": 19, + "’are": 19, + "oab": 19, + "upoo": 19, + "aroo": 19, + "to’a": 19, + "auri": 19, + "ātea": 19, + 
"hiah": 19, + "dona": 19, + "òte": 19, + "ata'": 19, + "ata,": 19, + "arai": 19, + "lisa": 19, + "āne,": 19, + "beth": 19, + "isab": 19, + "sabe": 19, + "tuam": 19, + "gaa": 19, + ",he": 19, + "ava'": 19, + "ho'i": 19, + "lb": 18, + "(e": 18, + "(p": 18, + "èr": 18, + "āf": 18, + "sn": 18, + "gs": 18, + "ʻi": 18, + "emp": 18, + "lat": 18, + "niu": 18, + "oll": 18, + "mt": 18, + "ta‘": 18, + "apû": 18, + "a-o": 18, + "râ,": 18, + "dor": 18, + "cle": 18, + "vie": 18, + "hat": 18, + "pre": 18, + "a'u": 18, + "ald": 18, + "lde": 18, + "eiv": 18, + "kei": 18, + "pin": 18, + "rūt": 18, + ",s": 18, + "7t": 18, + "cto": 18, + "pop": 18, + "ula": 18, + "abi": 18, + "qui": 18, + "oot": 18, + "pāt": 18, + "mei": 18, + "pro": 18, + "sou": 18, + "tic": 18, + "sin": 18, + "eà": 18, + "med": 18, + "wai": 18, + "hoe": 18, + "ago": 18, + "seb": 18, + "rel": 18, + "'au": 18, + "o‘o": 18, + "hi‘": 18, + "erk": 18, + "ász": 18, + "ri-": 18, + "toe": 18, + "u'a": 18, + "ella": 18, + "eop": 18, + "nçai": 18, + "eso": 18, + "olyn": 18, + "-raa": 18, + "iter": 18, + "atea": 18, + "hara": 18, + "topu": 18, + "hoho": 18, + "pupi": 18, + "upir": 18, + "rūti": 18, + "ūtia": 18, + "mite": 18, + "ti’a": 18, + "land": 18, + "tāva": 18, + "āvan": 18, + "riki": 18, + "maor": 18, + "14n": 18, + "apao": 18, + "hiro": 18, + "titi": 18, + "iaè": 18, + "i,u": 18, + "15n": 18, + "ea‘": 18, + "anat": 18, + "unga": 18, + "nga,": 18, + "akam": 18, + "taei": 18, + "toa,": 18, + "'aa": 18, + "rii,": 18, + "reer": 18, + "nyan": 18, + "buku": 18, + "kuts": 18, + "utsa": 18, + "imal": 18, + "lp": 17, + "pp": 17, + "ft": 17, + "31": 17, + "40": 17, + "-n": 17, + "tm": 17, + "ù": 17, + "any": 17, + "ser": 17, + "bol": 17, + "ban": 17, + "rio": 17, + "ral": 17, + "pau": 17, + "lor": 17, + "ōra": 17, + "rés": 17, + "ios": 17, + "nur": 17, + "āri": 17, + "dt": 17, + "dem": 17, + "ank": 17, + "nés": 17, + "ces": 17, + "lli": 17, + "esa": 17, + "bia": 17, + "ou,": 17, + "raì": 17, + "mak": 17, + "kum": 17, + "arī": 
17, + "moh": 17, + "te|": 17, + "pa’": 17, + "aif": 17, + "ode": 17, + "arc": 17, + "lik": 17, + "āto": 17, + "dol": 17, + "thi": 17, + "ico": 17, + "vei": 17, + "rob": 17, + "sle": 17, + "mba": 17, + "aa'": 17, + "ewa": 17, + "oip": 17, + "uor": 17, + "hem": 17, + "ofo": 17, + ")nō": 17, + "tani": 17, + "pora": 17, + "ta'i": 17, + "rere": 17, + "onya": 17, + "nōp": 17, + "to’n": 17, + "o’na": 17, + "aaor": 17, + "papû": 17, + "ehen": 17, + "epup": 17, + "nava": 17, + "tern": 17, + "tte|": 17, + "eani": 17, + "lap": 17, + "e.h": 17, + "12n": 17, + "ange": 17, + "enti": 17, + "i.i": 17, + "23n": 17, + "rani": 17, + "patu": 17, + "apae": 17, + "oa't": 17, + "oia.": 17, + "èno": 17, + "anua": 17, + "fara": 17, + "taia": 17, + "ra‘a": 17, + "aaip": 17, + "aipo": 17, + "ipoi": 17, + "poip": 17, + "oipo": 17, + ",na": 17, + "parī": 17, + ",fa": 17, + "i,m": 17, + "tape": 17, + "whan": 17, + "avai": 17, + "rira": 17, + "noe": 17, + "niho": 17, + "21n": 17, + "11n": 17, + "aoti": 17, + "a,k": 17, + "akoa": 17, + "arik": 17, + "oke": 17, + "i.1": 17, + "aein": 17, + "eree": 17, + "eere": 17, + "abuk": 17, + "ofor": 17, + "fori": 17, + "ri-a": 17, + "l'": 16, + "ps": 16, + "ds": 16, + "ej": 16, + "ʻa": 16, + "28": 16, + "‘ā": 16, + "‘ō": 16, + "(r": 16, + "īi": 16, + "yl": 16, + "án": 16, + "ty": 16, + "nto": 16, + "olo": 16, + "liu": 16, + "tra": 16, + "erg": 16, + "oad": 16, + "rti": 16, + "let": 16, + "8t": 16, + "nsi": 16, + "dic": 16, + "‘ar": 16, + "ti‘": 16, + "esu": 16, + "eda": 16, + "tār": 16, + ".3": 16, + "oa-": 16, + "yné": 16, + "ive": 16, + "ost": 16, + "oss": 16, + "ri,": 16, + "rīi": 16, + "īih": 16, + "e9": 16, + "bla": 16, + "uss": 16, + "ru.": 16, + "6t": 16, + "vit": 16, + "maì": 16, + "m),": 16, + "an-": 16, + "kon": 16, + "uba": 16, + "wan": 16, + "mic": 16, + "jos": 16, + "uki": 16, + "amb": 16, + "eô": 16, + "nna": 16, + "ae,": 16, + "obo": 16, + "ihe": 16, + "ouh": 16, + "ufu": 16, + "'im": 16, + "'op": 16, + "orl": 16, + "ti;": 16, + "eel": 16, + 
"fuo": 16, + "eld": 16, + "anta": 16, + "bert": 16, + "renc": 16, + "lyné": 16, + "ynés": 16, + "nési": 16, + "ésie": 16, + "ence": 16, + "a.h": 16, + "tati": 16, + "ophe": 16, + "aato": 16, + "evan": 16, + "ti‘a": 16, + "ho‘i": 16, + "itau": 16, + "piih": 16, + "arâ": 16, + "mili": 16, + "poro": 16, + "ora,": 16, + "o,t": 16, + "tean": 16, + "airo": 16, + "e20": 16, + "teô": 16, + "apā": 16, + "aoro": 16, + "24n": 16, + "tair": 16, + "miti": 16, + "teti": 16, + "apot": 16, + "repo": 16, + "hi‘o": 16, + "itah": 16, + "arīi": 16, + "rīih": 16, + "īihi": 16, + ",to": 16, + "naan": 16, + "atup": 16, + "upur": 16, + "tuah": 16, + "mono": 16, + "meha": 16, + "kore": 16, + "elis": 16, + "22n": 16, + "afir": 16, + "16n": 16, + "eeh": 16, + "oera": 16, + "a'i,": 16, + "na'o": 16, + "'ahi": 16, + "va'e": 16, + "lc": 15, + "-s": 15, + "ō'": 15, + "t.": 15, + "rv": 15, + "dé": 15, + "nf": 15, + "ym": 15, + "(n": 15, + "\"t": 15, + "mf": 15, + "lad": 15, + "arr": 15, + "rri": 15, + "val": 15, + "bre": 15, + "ius": 15, + "der": 15, + "bou": 15, + "azi": 15, + "a-h": 15, + "pa‘": 15, + "pee": 15, + "sch": 15, + "ogr": 15, + "age": 15, + "uli": 15, + "fol": 15, + "bac": 15, + "vao": 15, + "i6": 15, + "rna": 15, + "vic": 15, + "enk": 15, + "ri.": 15, + "al-": 15, + "aìt": 15, + "evi": 15, + "tho": 15, + "nno": 15, + "nac": 15, + "dad": 15, + "rdo": 15, + "fif": 15, + "whi": 15, + "sma": 15, + "lic": 15, + "usi": 15, + "osi": 15, + ";u": 15, + "e6": 15, + "a‘u": 15, + "kil": 15, + "ka.": 15, + "gye": 15, + "3t": 15, + "sah": 15, + "ha,": 15, + "po'": 15, + "eï": 15, + "ao'": 15, + "sum": 15, + "fatu": 15, + "mori": 15, + "erra": 15, + "pōra": 15, + "ōran": 15, + "e,u": 15, + "iesu": 15, + "e.e": 15, + "eneh": 15, + "eek": 15, + "auta": 15, + "lion": 15, + "ātia": 15, + "tia.": 15, + "āria": 15, + "oal": 15, + "te\"": 15, + "ranc": 15, + "port": 15, + "pari": 15, + "inte": 15, + "te3": 15, + "aran": 15, + "anav": 15, + "itor": 15, + "ouri": 15, + "u,t": 15, + "i,o": 15, + "rati": 
15, + "iata": 15, + "oii": 15, + ";ua": 15, + "taui": 15, + "aise": 15, + "pāti": 15, + "mota": 15, + "orin": 15, + "inet": 15, + "ctor": 15, + "na‘o": 15, + "eva,": 15, + "hotu": 15, + "iman": 15, + "apor": 15, + "enga": 15, + "tou,": 15, + "fifi": 15, + "itir": 15, + "noa,": 15, + "kato": 15, + "iie": 15, + "atat": 15, + "ahau": 15, + "anti": 15, + "nip": 15, + "no’": 15, + "taj": 15, + "achi": 15, + "17n": 15, + "neo": 15, + "ngar": 15, + "anei": 15, + "anna": 15, + "aupa": 15, + "ori-": 15, + "'ie": 15, + "'io": 15, + "eïa": 15, + "aaot": 15, + "arur": 15, + "iti;": 15, + "sier": 15, + "i'op": 15, + "'opo": 15, + "sota": 15, + "otai": 15, + "o'ah": 15, + "tao'": 15, + "ao'a": 15, + "irik": 15, + "kufu": 15, + "ufuo": 15, + "fuor": 15, + "ex": 14, + "wo": 14, + "xa": 14, + "1.": 14, + "té": 14, + "-f": 14, + "(i": 14, + "sb": 14, + "(h": 14, + "d.": 14, + "-e": 14, + "35": 14, + "\".": 14, + "e;": 14, + "r.": 14, + "-g": 14, + "má": 14, + "fre": 14, + "ras": 14, + "ult": 14, + "riu": 14, + "dre": 14, + "pon": 14, + ":2": 14, + "nep": 14, + "itā": 14, + "tad": 14, + "adi": 14, + "log": 14, + "obe": 14, + "nye": 14, + "lie": 14, + "tol": 14, + "iè": 14, + "nuk": 14, + "hik": 14, + "aoa": 14, + "rak": 14, + "rek": 14, + "pie": 14, + "000": 14, + "ro.": 14, + "iot": 14, + "sco": 14, + "e5": 14, + "sis": 14, + "cen": 14, + "oue": 14, + "ect": 14, + "vea": 14, + "flo": 14, + "lma": 14, + "ifo": 14, + "hal": 14, + "e’a": 14, + "dou": 14, + "jac": 14, + "lei": 14, + "òj": 14, + "tch": 14, + "’or": 14, + "ifā": 14, + "toh": 14, + "ted": 14, + "hue": 14, + "fai": 14, + "raw": 14, + "n1": 14, + "ngs": 14, + "agh": 14, + "cse": 14, + "oak": 14, + "oah": 14, + "rā'": 14, + "'i.": 14, + "ei;": 14, + "sa-": 14, + "-on": 14, + "hu'": 14, + "yte": 14, + "nuku": 14, + "esd": 14, + "mart": 14, + "ojo": 14, + "ti(": 14, + "urit": 14, + "indi": 14, + "ata.": 14, + "uara": 14, + "na‘e": 14, + "iim": 14, + "ogra": 14, + "anda": 14, + "rist": 14, + "scar": 14, + "aris": 14, + "erna": 
14, + "eom": 14, + "uita": 14, + "’amo": 14, + "inā": 14, + "i,h": 14, + "reta": 14, + "29n": 14, + "uaru": 14, + "rohi": 14, + "teà": 14, + "era,": 14, + "erit": 14, + "ther": 14, + "fa‘a": 14, + "o.t": 14, + "aiat": 14, + "char": 14, + "line": 14, + "mo‘o": 14, + "êma": 14, + "eara": 14, + ".he": 14, + "pene": 14, + "niè": 14, + "ièn": 14, + "apuk": 14, + "akat": 14, + "akah": 14, + "ngat": 14, + "gata": 14, + "kama": 14, + "maui": 14, + "ooe": 14, + "ama,": 14, + "aaoh": 14, + "riir": 14, + "leke": 14, + "’ate": 14, + "nace": 14, + "abel": 14, + "ra'a": 14, + "chim": 14, + "nup": 14, + "tomi": 14, + "kapu": 14, + "koak": 14, + "oako": 14, + "ngah": 14, + "a'i.": 14, + "i;e": 14, + "nei;": 14, + "i.2": 14, + "ioe": 14, + "fric": 14, + "tsa-": 14, + "sa-o": 14, + "a-on": 14, + "-ony": 14, + "hu'a": 14, + "i-at": 14, + "-att": 14, + "korl": 14, + "orle": 14, + "ware": 14, + "uï": 13, + "ks": 13, + "āu": 13, + "1,": 13, + "nl": 13, + "ân": 13, + "ìr": 13, + "ão": 13, + "vr": 13, + "nb": 13, + "ál": 13, + "5.": 13, + ",0": 13, + "nr": 13, + "ōm": 13, + "yá": 13, + "dd": 13, + "ǔp": 13, + "ǔ": 13, + "u;": 13, + "ŭp": 13, + "alo": 13, + "pel": 13, + "alt": 13, + "reg": 13, + "rre": 13, + "roe": 13, + "obr": 13, + "sol": 13, + "arm": 13, + "aul": 13, + "aiv": 13, + "‘ir": 13, + "sio": 13, + "nso": 13, + "red": 13, + "ro‘": 13, + "oa’": 13, + "ai‘": 13, + "onu": 13, + "pra": 13, + "’it": 13, + "uet": 13, + ".v": 13, + "luv": 13, + "uvi": 13, + "gai": 13, + "mpa": 13, + "nue": 13, + "mae": 13, + "'oe": 13, + "omm": 13, + "sf": 13, + "ois": 13, + "oso": 13, + "alv": 13, + "rol": 13, + "reu": 13, + "soc": 13, + "rid": 13, + "tu,": 13, + "òv": 13, + "kia": 13, + "kir": 13, + "i3": 13, + "i9": 13, + "nko": 13, + "’ap": 13, + "dri": 13, + "a’e": 13, + "oci": 13, + "num": 13, + "sai": 13, + "ski": 13, + "til": 13, + "hes": 13, + "nas": 13, + "um)": 13, + "oac": 13, + "osc": 13, + "itr": 13, + "jea": 13, + ":m": 13, + "peh": 13, + "eba": 13, + "’oh": 13, + "yam": 13, + "jan": 
13, + "ker": 13, + "ley": 13, + "uin": 13, + "na’": 13, + "eik": 13, + "rec": 13, + "ua’": 13, + "etr": 13, + "a•": 13, + "ā‘a": 13, + "êh": 13, + "âi": 13, + "‘an": 13, + "ēf": 13, + "dil": 13, + "s1": 13, + "aou": 13, + "obi": 13, + "4t": 13, + "oki": 13, + "ket": 13, + "kaw": 13, + "uau": 13, + "kua": 13, + "ā'a": 13, + "ige": 13, + "pǔp": 13, + "ǔpǔ": 13, + "oku": 13, + "ïa.": 13, + ";o": 13, + "ôa": 13, + "wag": 13, + "uïa": 13, + "pŭp": 13, + "ŭpŭ": 13, + "'ih": 13, + "-gy": 13, + "a()": 13, + "i.h": 13, + "luvi": 13, + "ller": 13, + "stan": 13, + "arle": 13, + "anet": 13, + "a:1": 13, + "ensi": 13, + "vair": 13, + "sion": 13, + "anel": 13, + "neli": 13, + "mo‘a": 13, + "eaa": 13, + "mai.": 13, + "nif": 13, + ".ha": 13, + "pure": 13, + "iora": 13, + "erep": 13, + "a.3": 13, + ",me": 13, + "tia,": 13, + "icia": 13, + "0ta": 13, + "mini": 13, + "ande": 13, + "ooti": 13, + "na(": 13, + "mene": 13, + "iana": 13, + "itea": 13, + "u.u": 13, + "apō": 13, + "anui": 13, + "emen": 13, + "u.e": 13, + "tava": 13, + "mate": 13, + "atia": 13, + "imot": 13, + "etō": 13, + "hing": 13, + "a:t": 13, + "hare": 13, + "ro(": 13, + "ēfa": 13, + "aine": 13, + "nām": 13, + "arut": 13, + "rutu": 13, + "kara": 13, + "rane": 13, + "ane,": 13, + "enia": 13, + "iteh": 13, + "tehi": 13, + "ndol": 13, + "dola": 13, + "25n": 13, + "laa": 13, + "musa": 13, + "um),": 13, + "chel": 13, + "jean": 13, + "orua": 13, + "ifol": 13, + "foli": 13, + "whai": 13, + "ling": 13, + "peri": 13, + "rong": 13, + "upap": 13, + "gaha": 13, + "ā'au": 13, + "a'ir": 13, + "pǔpǔ": 13, + "ïah": 13, + "kwag": 13, + "wagh": 13, + "'af": 13, + "pŭpŭ": 13, + "cler": 13, + "lerk": 13, + "ms": 12, + "ûr": 12, + "h,": 12, + "с": 12, + "01": 12, + "sé": 12, + "ox": 12, + "tl": 12, + "[": 12, + "vā": 12, + "ā,": 12, + "a\"": 12, + "iā": 12, + "50": 12, + "ōh": 12, + "(s": 12, + "iy": 12, + "ŭ": 12, + "ega": 12, + "bor": 12, + "ebe": 12, + "-fa": 12, + ",d": 12, + "aus": 12, + "olu": 12, + "lum": 12, + "ves": 12, + "ned": 
12, + "ese": 12, + "mun": 12, + "vav": 12, + "aìr": 12, + "ike": 12, + "to,": 12, + "uak": 12, + "ia)": 12, + "uve": 12, + "asc": 12, + "ild": 12, + "nst": 12, + "ael": 12, + "hol": 12, + "re-": 12, + "rto": 12, + "nne": 12, + "act": 12, + "inh": 12, + "dio": 12, + "aso": 12, + "luc": 12, + "ile": 12, + "nca": 12, + "elm": 12, + "ta)": 12, + "poa": 12, + "tac": 12, + "edu": 12, + "rce": 12, + "ōf": 12, + "mma": 12, + "ail": 12, + "mār": 12, + "ea.": 12, + "rag": 12, + "dav": 12, + "iko": 12, + "ott": 12, + "tig": 12, + "ict": 12, + "use": 12, + "on,": 12, + "ans": 12, + "er,": 12, + "ory": 12, + "bis": 12, + "ubi": 12, + "(te": 12, + ",r": 12, + "nut": 12, + "āvi": 12, + ":e": 12, + "tab": 12, + "rip": 12, + "-te": 12, + "re‘": 12, + "mam": 12, + "ēp": 12, + ",1": 12, + "nad": 12, + "lda": 12, + ";i": 12, + "opi": 12, + "zer": 12, + "lif": 12, + "e7": 12, + "lee": 12, + "nyá": 12, + "esz": 12, + "nyi": 12, + "dag": 12, + "'oh": 12, + "ôi": 12, + "4e": 12, + "ilu": 12, + "mte": 12, + "a-hi": 12, + "elle": 12, + "nces": 12, + "dep": 12, + ").t": 12, + "dica": 12, + "epha": 12, + "oron": 12, + "roph": 12, + "meri": 12, + "misi": 12, + "vane": 12, + "-faa": 12, + "aaha": 12, + "ilio": 12, + "tītī": 12, + "repi": 12, + "peti": 12, + "illa": 12, + "pera": 12, + "deg": 12, + "olin": 12, + "ti2": 12, + "ance": 12, + "1te": 12, + "nōm": 12, + "ōma": 12, + "te4": 12, + "titu": 12, + "imat": 12, + "eren": 12, + "cent": 12, + "e12": 12, + "soci": 12, + "cial": 12, + "maìt": 12, + "aìti": 12, + "anur": 12, + "mera": 12, + "sain": 12, + "hono": 12, + "’ohi": 12, + "ston": 12, + "tāvi": 12, + "āvin": 12, + "ātou": 12, + "upun": 12, + "ato'": 12, + "noa'": 12, + "uter": 12, + "tiri": 12, + "auu": 12, + "ruta": 12, + "rine": 12, + "anue": 12, + "tong": 12, + "re‘a": 12, + "pehe": 12, + "heo": 12, + "oêh": 12, + "râi": 12, + "area": 12, + "arer": 12, + "anir": 12, + "aapo": 12, + "aiva": 12, + "òfa": 12, + "te'": 12, + "nōf": 12, + "roa'": 12, + "orge": 12, + "akap": 12, + "nahi": 
12, + "ola,": 12, + "etii": 12, + "10n": 12, + "otia": 12, + "uard": 12, + "ouis": 12, + "kaha": 12, + "aiao": 12, + "cana": 12, + "iace": 12, + "eki": 12, + "ta),": 12, + "ingi": 12, + "risi": 12, + "tapo": 12, + "pear": 12, + "ings": 12, + "kaup": 12, + "tuhi": 12, + "'ohi": 12, + "'ii": 12, + "ameh": 12, + "o'ir": 12, + "oti'": 12, + "kuma": 12, + "xi": 11, + "dy": 11, + "ux": 11, + "mc": 11, + "8.": 11, + "ić": 11, + "ć": 11, + "īm": 11, + "īr": 11, + "aà": 11, + "u:": 11, + "“": 11, + "ùp": 11, + "sy": 11, + "sr": 11, + "*": 11, + "-b": 11, + "uz": 11, + "yu": 11, + "by": 11, + "kp": 11, + "y,": 11, + "(f": 11, + "c)": 11, + "tp": 11, + "uw": 11, + "mǎ": 11, + "d'e": 11, + "gua": 11, + "rup": 11, + "orr": 11, + "oel": 11, + "boa": 11, + "ule": 11, + "rdi": 11, + "rde": 11, + "zil": 11, + ":4": 11, + "ou-": 11, + "g1": 11, + "aeh": 11, + "’āt": 11, + "rse": 11, + "isc": 11, + "cre": 11, + "end": 11, + "pas": 11, + "tha": 11, + "atr": 11, + "vel": 11, + "cel": 11, + "aca": 11, + "alm": 11, + "sus": 11, + "huk": 11, + "iku": 11, + "’en": 11, + "aja": 11, + "bli": 11, + "bri": 11, + "ōpū": 11, + ",c": 11, + "aya": 11, + "rou": 11, + "eet": 11, + "nol": 11, + "gui": 11, + "oco": 11, + "nth": 11, + "bro": 11, + "zin": 11, + "dul": 11, + "ond": 11, + "alp": 11, + "add": 11, + "inu": 11, + "ntr": 11, + "ary": 11, + "det": 11, + "èra": 11, + "lbe": 11, + "ust": 11, + "hri": 11, + "rba": 11, + "ias": 11, + "hut": 11, + "pep": 11, + "now": 11, + "gor": 11, + "itc": 11, + "puh": 11, + "rue": 11, + "ma.": 11, + "āhi": 11, + "eā": 11, + "ēm": 11, + "pa,": 11, + "taì": 11, + "o1": 11, + "no.": 11, + "i-r": 11, + "ri’": 11, + "‘ao": 11, + "îi": 11, + "va.": 11, + "tu.": 11, + "\"te": 11, + "iwa": 11, + "'am": 11, + "hea": 11, + ".4": 11, + "oun": 11, + "eko": 11, + "naw": 11, + "a3": 11, + "hoo": 11, + "csi": 11, + "ebi": 11, + "amf": 11, + "8e": 11, + "yem": 11, + "esl": 11, + "kye": 11, + "taru": 11, + "hif": 11, + "ntm": 11, + "terr": 11, + "lte": 11, + "ntal": 11, + 
"’oe": 11, + "’of": 11, + "tien": 11, + "nota": 11, + "rau-": 11, + "comm": 11, + "oos": 11, + "pres": 11, + "anio": 11, + "ōpō": 11, + "cati": 11, + "iose": 11, + "apa‘": 11, + "a‘ir": 11, + "pero": 11, + "erop": 11, + "‘ara": 11, + "tua.": 11, + "apap": 11, + "opua": 11, + "ro‘a": 11, + "dte": 11, + "anō": 11, + "oris": 11, + "vill": 11, + "anto": 11, + "toni": 11, + "isti": 11, + "stin": 11, + "tina": 11, + "oag": 11, + "ente": 11, + "enko": 11, + "pier": 11, + "e,f": 11, + "poot": 11, + "o,u": 11, + "ite,": 11, + "),e": 11, + "mora": 11, + "oap": 11, + "erp": 11, + "13n": 11, + "iran": 11, + "o.e": 11, + "itan": 11, + "ato’": 11, + "aute": 11, + "ātit": 11, + "itif": 11, + "tifā": 11, + "mete": 11, + "au(": 11, + "ipā": 11, + "nuel": 11, + "nald": 11, + "ri’i": 11, + "aaru": 11, + "),i": 11, + "aain": 11, + "inei": 11, + "eine": 11, + "vava": 11, + "tena": 11, + "òmo": 11, + "oen": 11, + "tein": 11, + "urei": 11, + "taki": 11, + "tika": 11, + "anak": 11, + "karo": 11, + "ina,": 11, + "rât": 11, + "turi": 11, + "egr": 11, + "rand": 11, + "uaai": 11, + "a,a": 11, + "bera": 11, + "e10": 11, + "orer": 11, + "18n": 11, + "ika.": 11, + "27n": 11, + "niti": 11, + "fait": 11, + "lika": 11, + "mich": 11, + "phil": 11, + "ura.": 11, + "toa.": 11, + "itch": 11, + "utai": 11, + "aure": 11, + "noha": 11, + "urut": 11, + "-mai": 11, + "ican": 11, + "tohu": 11, + "hi(": 11, + "olan": 11, + "26n": 11, + "lame": 11, + "himo": 11, + "akan": 11, + "taho": 11, + "robi": 11, + "whar": 11, + "gap": 11, + "eku": 11, + "iger": 11, + "oho'": 11, + "ho'a": 11, + "'ip": 11, + "huer": 11, + "uero": 11, + "inah": 11, + "arir": 11, + "ophi": 11, + "sema": 11, + "dilu": 11, + "iluv": 11, + "nair": 11, + "aho'": 11, + "omit": 11, + "uaar": 11, + "umas": 11, + "masi": 11, + "í": 10, + "'ē": 10, + "ln": 10, + "4.": 10, + "41": 10, + "е": 10, + "\"p": 10, + ".c": 10, + "mâ": 10, + "āa": 10, + "56": 10, + "aʻ": 10, + "i\"": 10, + "ôm": 10, + "gt": 10, + "o)": 10, + "-k": 10, + "hl": 10, + "97": 
10, + "0,": 10, + "(g": 10, + "lh": 10, + "lk": 10, + "-j": 10, + "rá": 10, + "bá": 10, + "tá": 10, + "áv": 10, + "sá": 10, + "h.": 10, + "wl": 10, + "alb": 10, + "pla": 10, + "lac": 10, + "tf": 10, + "rro": 10, + "ges": 10, + "gel": 10, + "rme": 10, + "mol": 10, + "pré": 10, + "ité": 10, + "vir": 10, + "pōt": 10, + "sac": 10, + "amp": 10, + "'ap": 10, + "erc": 10, + "spe": 10, + "nch": 10, + "ars": 10, + "hos": 10, + "uda": 10, + "ude": 10, + "vid": 10, + "vet": 10, + "arg": 10, + "nou": 10, + "roc": 10, + "ink": 10, + "a).": 10, + "i8": 10, + "oth": 10, + "’a’": 10, + "moe": 10, + "ra)": 10, + "bde": 10, + "àò": 10, + "hām": 10, + "ho,": 10, + "cti": 10, + "is)": 10, + "nha": 10, + "dec": 10, + "dal": 10, + "liv": 10, + "cho": 10, + "mos": 10, + "git": 10, + "auc": 10, + "osu": 10, + "dac": 10, + "cit": 10, + "tru": 10, + "āpo": 10, + "òg": 10, + "sur": 10, + "2m": 10, + "oul": 10, + "ego": 10, + "rod": 10, + "eun": 10, + "chr": 10, + "mfi": 10, + "o'o": 10, + "ruh": 10, + "rāt": 10, + "mā’": 10, + ",v": 10, + "to.": 10, + ")e": 10, + "moo": 10, + ";t": 10, + "ìra": 10, + "hep": 10, + "‘at": 10, + "oet": 10, + "rma": 10, + "sir": 10, + "was": 10, + "‘ah": 10, + "pūn": 10, + "ùpō": 10, + "ōrū": 10, + "pak": 10, + "re'": 10, + "ubu": 10, + "ebo": 10, + "eo,": 10, + "n2": 10, + "kom": 10, + "inc": 10, + "apr": 10, + "hah": 10, + "pok": 10, + "isz": 10, + ":k": 10, + "ā1": 10, + "whe": 10, + "ogy": 10, + "hih": 10, + "owa": 10, + "pe'": 10, + "3u": 10, + ".6": 10, + ".8": 10, + "2u": 10, + "gya": 10, + "awl": 10, + "wli": 10, + "or,": 10, + "huat": 10, + "urā": 10, + "lst": 10, + "temp": 10, + "ôma": 10, + "etd": 10, + "ndre": 10, + "prés": 10, + "ndic": 10, + "atif": 10, + "‘ira": 10, + "hou-": 10, + "sia.": 10, + "ora.": 10, + "utah": 10, + "eura": 10, + "apee": 10, + "otā": 10, + "i’ā": 10, + "’āti": 10, + "nior": 10, + "ra(": 10, + "a(,": 10, + "epia": 10, + ".vi": 10, + "pala": 10, + "ti3": 10, + "ti7": 10, + "ti8": 10, + "ti9": 10, + "00m": 10, + "ita,": 10, + 
"e,m": 10, + "rnat": 10, + "russ": 10, + "eror": 10, + "’ama": 10, + "u.t": 10, + "nsti": 10, + "stit": 10, + "stat": 10, + "ied": 10, + "tour": 10, + "abde": 10, + "bdel": 10, + "arti": 10, + "ocia": 10, + "eete": 10, + "iho,": 10, + "aint": 10, + "afā": 10, + "ress": 10, + "a(e": 10, + "gast": 10, + "asto": 10, + "e.i": 10, + "òhip": 10, + "nara": 10, + "e’ā": 10, + "rian": 10, + "'eo": 10, + "atin": 10, + "utā": 10, + "teā": 10, + "auia": 10, + "uanu": 10, + "ìraa": 10, + "e‘ā": 10, + "o‘or": 10, + "òpa": 10, + "dent": 10, + "unit": 10, + "angi": 10, + "‘oa,": 10, + "a.p": 10, + "aro,": 10, + "apit": 10, + "orot": 10, + "tear": 10, + "ri(": 10, + "ùpōr": 10, + "pōrū": 10, + "aput": 10, + "huah": 10, + "òva": 10, + "itat": 10, + "te6": 10, + "atep": 10, + "òra": 10, + "nake": 10, + "oia,": 10, + "meni": 10, + "naar": 10, + "muo": 10, + ".na": 10, + "dade": 10, + "piah": 10, + "ford": 10, + "olia": 10, + "stro": 10, + "ilda": 10, + "asso": 10, + "laur": 10, + "lber": 10, + "reo,": 10, + "arin": 10, + "tiai": 10, + "anth": 10, + "eric": 10, + "pei": 10, + "ata)": 10, + "loui": 10, + "ii1": 10, + "mēf": 10, + "lone": 10, + "mā1": 10, + "5te": 10, + "otir": 10, + "kang": 10, + "kaar": 10, + "uwa": 10, + "rā'a": 10, + "a'ah": 10, + "oee": 10, + "pe'a": 10, + "kana": 10, + "3ua": 10, + "a;u": 10, + "2ua": 10, + ".13": 10, + ".20": 10, + "aha,": 10, + "’tur": 10, + "aphe": 10, + "osie": 10, + "nob": 10, + "erê": 10, + "'et": 10, + "ta'u": 10, + "nene": 10, + "apea": 10, + "rawl": 10, + "awli": 10, + "wlin": 10, + "ó": 9, + "-l": 9, + "ys": 9, + "aç": 9, + "rz": 9, + "lg": 9, + "3.": 9, + "ht": 9, + "nē": 9, + "иј": 9, + "а": 9, + "àh": 9, + "ài": 9, + "oè": 9, + "6.": 9, + "45": 9, + "yc": 9, + "dj": 9, + "oy": 9, + "éd": 9, + "ūr": 9, + "àp": 9, + "\",": 9, + "yd": 9, + "dn": 9, + "cq": 9, + "oz": 9, + "=": 9, + "46": 9, + "d,": 9, + "zk": 9, + "hm": 9, + "s-": 9, + "vá": 9, + "kr": 9, + "gá": 9, + "’ō": 9, + "kā": 9, + "lā": 9, + "]": 9, + "mpo": 9, + "lom": 9, + 
"rig": 9, + "àd": 9, + "thu": 9, + "uei": 9, + "igu": 9, + "jon": 9, + "rab": 9, + "lim": 9, + "ses": 9, + "iba": 9, + "raz": 9, + "il.": 9, + "9t": 9, + "uâ": 9, + "ōnē": 9, + "itō": 9, + "aco": 9, + "emu": 9, + "gli": 9, + "ish": 9, + "hav": 9, + "und": 9, + "arb": 9, + "lot": 9, + "jul": 9, + "ki,": 9, + "riv": 9, + "lal": 9, + "e8": 9, + ".r": 9, + "’ai": 9, + "pho": 9, + "cou": 9, + "she": 9, + "mā'": 9, + "’a.": 9, + "sul": 9, + "mbr": 9, + "onc": 9, + "tīr": 9, + "(re": 9, + "āfi": 9, + "ize": 9, + "xan": 9, + "ìp": 9, + "āma": 9, + "es.": 9, + "on.": 9, + "ack": 9, + "s).": 9, + "bat": 9, + "iso": 9, + "odi": 9, + ":o": 9, + "ibe": 9, + "ofi": 9, + "cul": 9, + "us)": 9, + "cum": 9, + "umi": 9, + "rch": 9, + "odo": 9, + "sea": 9, + "piu": 9, + "a-m": 9, + "oin": 9, + "dra": 9, + "cos": 9, + "hīm": 9, + "īme": 9, + "map": 9, + "gov": 9, + "ija": 9, + "dua": 9, + "acq": 9, + "cqu": 9, + "vas": 9, + "sci": 9, + "dom": 9, + "aza": 9, + "gil": 9, + "mih": 9, + "oon": 9, + "dat": 9, + "rub": 9, + ";1": 9, + "aaà": 9, + "o2": 9, + "ha‘": 9, + "ngt": 9, + "āfa": 9, + "0e": 9, + "mēt": 9, + "i),": 9, + "pu,": 9, + "i'i": 9, + ",'": 9, + "mia": 9, + "uhe": 9, + "tōn": 9, + "gre": 9, + "grâ": 9, + "rân": 9, + "ând": 9, + "vre": 9, + "lah": 9, + "rog": 9, + "df": 9, + "ōhi": 9, + "enr": 9, + "kha": 9, + "ufo": 9, + "tus": 9, + "ále": 9, + "e'i": 9, + "ā3": 9, + "ā4": 9, + "9u": 9, + "6e": 9, + "aiw": 9, + "ua;": 9, + "waa": 9, + "koi": 9, + "pum": 9, + "kae": 9, + "ne'": 9, + ".7": 9, + "3e": 9, + "po,": 9, + "9e": 9, + ";p": 9, + "yek": 9, + "agy": 9, + "’ena": 9, + "enan": 9, + "i.n": 9, + "tutu": 9, + "a(p": 9, + "alla": 9, + "àde": 9, + "anot": 9, + "otau": 9, + "osta": 9, + "juli": 9, + "tell": 9, + "tres": 9, + "nhu": 9, + "roni": 9, + "huna": 9, + "pa‘i": 9, + ").e": 9, + "sia,": 9, + "a.n": 9, + "aafa": 9, + "a.o": 9, + "ng1": 9, + "ehar": 9, + "rehi": 9, + "tuâ": 9, + "‘ora": 9, + "ache": 9, + "nitō": 9, + "uete": 9, + "lles": 9, + "’og": 9, + "astr": 9, + 
"arme": 9, + "boad": 9, + "ānia": 9, + "rena": 9, + "()t": 9, + "o.u": 9, + "atet": 9, + "iano": 9, + "oau": 9, + "inst": 9, + "itut": 9, + "pour": 9, + "ques": 9, + "(reo": 9, + "āfir": 9, + ",fā": 9, + "aìp": 9, + "mai,": 9, + "peet": 9, + "tero": 9, + "te9": 9, + "2ta": 9, + "mada": 9, + "lanc": 9, + "tano": 9, + "r,t": 9, + "faae": 9, + "aaea": 9, + "item": 9, + "faaà": 9, + "tomo": 9, + "aret": 9, + "aom": 9, + "avea": 9, + "uii": 9, + "mero": 9, + "0ti": 9, + "hata": 9, + "tai.": 9, + "hune": 9, + "nuan": 9, + "ataì": 9, + "ere.": 9, + "mii": 9, + "onia": 9, + "pati": 9, + "ha‘a": 9, + "vern": 9, + "eni.": 9, + "shin": 9, + "ton,": 9, + "oft": 9, + "harl": 9, + "rles": 9, + "ari’": 9, + "‘ore": 9, + "pîi": 9, + "kilo": 9, + "ahar": 9, + "êpa": 9, + "e15": 9, + "te5": 9, + "jose": 9, + "ia‘u": 9, + "aìra": 9, + "a)i": 9, + "mea,": 9, + "utap": 9, + "maup": 9, + "aupi": 9, + "eoe": 9, + "ruhi": 9, + "lca": 9, + "jacq": 9, + "acqu": 9, + "ōfe": 9, + "uka,": 9, + "rung": 9, + "hau,": 9, + "neng": 9, + "kuta": 9, + ".11": 9, + "oou": 9, + "hīme": 9, + "īmen": 9, + "grân": 9, + "rând": 9, + "ândo": 9, + "a,h": 9, + "rate": 9, + "idad": 9, + "mpan": 9, + "gran": 9, + "goi": 9, + "vict": 9, + "icto": 9, + "mum": 9, + "itoi": 9, + "oara": 9, + "a.f": 9, + "ū.t": 9, + "auru": 9, + "iche": 9, + "mina": 9, + "frit": 9, + "maat": 9, + "ean-": 9, + "chri": 9, + "hris": 9, + "nef": 9, + "pium": 9, + "nma": 9, + "itar": 9, + "ardo": 9, + "oed": 9, + ",ka": 9, + "e21": 9, + "etī": 9, + "puhi": 9, + "arie": 9, + "moha": 9, + "oham": 9, + "ongo": 9, + "uke": 9, + "nawa": 9, + "muit": 9, + "akw": 9, + "cseb": 9, + "olog": 9, + "agas": 9, + ",ko": 9, + "mā3": 9, + "mā4": 9, + "ahoe": 9, + "hoer": 9, + "era'": 9, + "a.k": 9, + "taon": 9, + "aong": 9, + "ori,": 9, + "kaat": 9, + "ape'": 9, + "'ia": 9, + "tige": 9, + "epǔ": 9, + ".19": 9, + ".21": 9, + ".pe": 9, + "ova,": 9, + "ôa‘": 9, + "enoh": 9, + "i,f": 9, + ";po": 9, + "iaph": 9, + "usia": 9, + "irob": 9, + "oned": 9, + 
"nedo": 9, + "edon": 9, + "opo'": 9, + "po'a": 9, + "epŭ": 9, + "i'am": 9, + "esle": 9, + "sley": 9, + "opok": 9, + "poku": 9, + "kuw": 9, + "gyam": 9, + "yamf": 9, + "amfi": 9, + "agye": 9, + "nq": 8, + "aî": 8, + "nv": 8, + "my": 8, + "n'": 8, + ".)": 8, + "2,": 8, + "a/": 8, + ".:": 8, + "+": 8, + "55": 8, + "»": 8, + "ср": 8, + "рб": 8, + "би": 8, + "-c": 8, + "âr": 8, + "èt": 8, + "9.": 8, + "2.": 8, + "vī": 8, + "\"a": 8, + "90": 8, + "âv": 8, + "él": 8, + "ūk": 8, + "o:": 8, + "uj": 8, + "‎": 8, + "zu": 8, + "ná": 8, + "nz": 8, + "g-": 8, + "zs": 8, + "mn": 8, + "cy": 8, + "|t": 8, + "mō": 8, + "bon": 8, + "d'a": 8, + "nt-": 8, + "cri": 8, + "elv": 8, + "dar": 8, + "hum": 8, + "lop": 8, + "iny": 8, + "iol": 8, + "cad": 8, + "cap": 8, + "rni": 8, + "lf": 8, + "ped": 8, + "el.": 8, + "‘a-": 8, + "mut": 8, + "i-f": 8, + "’to": 8, + "u-h": 8, + "da,": 8, + "oba": 8, + "āpō": 8, + "pōn": 8, + "ī(": 8, + "срб": 8, + "рби": 8, + "биј": 8, + "evo": 8, + "lag": 8, + "orn": 8, + "jor": 8, + "lem": 8, + "lex": 8, + "ngl": 8, + "wel": 8, + "aev": 8, + "you": 8, + "mme": 8, + "uur": 8, + "eak": 8, + "gla": 8, + "lai": 8, + "qua": 8, + "cin": 8, + "mie": 8, + "fin": 8, + "unt": 8, + "ats": 8, + "'en": 8, + "ue,": 8, + "fak": 8, + "iru": 8, + "teg": 8, + "rih": 8, + "rov": 8, + "mg": 8, + "i4": 8, + ":5": 8, + "chy": 8, + "ōa": 8, + ":3": 8, + "tis": 8, + "t1": 8, + "ubl": 8, + "-1": 8, + "fit": 8, + "’āf": 8, + "a*": 8, + "uad": 8, + "en,": 8, + "oò": 8, + "tok": 8, + "vaa": 8, + "rpo": 8, + "enn": 8, + "phy": 8, + "eci": 8, + "nev": 8, + "rib": 8, + "lme": 8, + "eid": 8, + "scu": 8, + "ā(": 8, + "agi": 8, + "llu": 8, + "lus": 8, + "eac": 8, + "icu": 8, + "alu": 8, + "vac": 8, + "geo": 8, + "n-r": 8, + "²m": 8, + "kim": 8, + "pos": 8, + "lip": 8, + "tāt": 8, + "inn": 8, + ",«": 8, + "nfo": 8, + ".g": 8, + "bai": 8, + "a’o": 8, + "aye": 8, + "yer": 8, + "zan": 8, + "sim": 8, + "gon": 8, + "ick": 8, + "omu": 8, + "amm": 8, + "ʻia": 8, + "duc": 8, + "von": 8, + "nbu": 8, + 
"u1": 8, + "1e": 8, + "eil": 8, + "his": 8, + "sno": 8, + "nus": 8, + "sam": 8, + "hyl": 8, + "ā’o": 8, + "aav": 8, + "-2": 8, + "ua'": 8, + "ou.": 8, + "ioa": 8, + "'a'": 8, + "aê": 8, + "mue": 8, + "2i": 8, + "‘a.": 8, + "‘am": 8, + "ech": 8, + "gto": 8, + "pu.": 8, + "dim": 8, + "a-n": 8, + "ūka": 8, + "ha.": 8, + "ma‘": 8, + ":a": 8, + "...": 8, + "(ta": 8, + "kiw": 8, + "bil": 8, + "âo": 8, + "u-m": 8, + "ên": 8, + "esb": 8, + "òe": 8, + "bi,": 8, + "1h": 8, + "faf": 8, + "āpu": 8, + "dna": 8, + "-pe": 8, + "lph": 8, + "a9": 8, + "l2": 8, + "wer": 8, + "has": 8, + "ng-": 8, + "a8": 8, + "a4": 8, + "rgh": 8, + "nig": 8, + "kik": 8, + "wes": 8, + "ics": 8, + "szk": 8, + "osz": 8, + "lij": 8, + "inb": 8, + "ā2": 8, + "wah": 8, + "oop": 8, + "7e": 8, + "ôn": 8, + "oe,": 8, + "ooh": 8, + "ya.": 8, + "uut": 8, + "tey": 8, + "oas": 8, + "du-": 8, + "u-g": 8, + "()n": 8, + "apet": 8, + "huka": 8, + "rihi": 8, + "va(": 8, + "ador": 8, + "selv": 8, + "elva": 8, + "anan": 8, + "nell": 8, + "erri": 8, + "awe": 8, + "usp": 8, + "tian": 8, + "'ahu": 8, + "assa": 8, + "aste": 8, + "alva": 8, + "a:2": 8, + "sent": 8, + "onh": 8, + "icat": 8, + "fte": 8, + "ata‘": 8, + "ato‘": 8, + "isio": 8, + "eiu": 8, + "nson": 8, + "a’to": 8, + "’toa": 8, + "tauh": 8, + "ïat": 8, + "u-hi": 8, + "aaï": 8, + "aher": 8, + ",ai": 8, + "ia’n": 8, + "urer": 8, + "ani,": 8, + "tāpō": 8, + "āpōn": 8, + "pōnē": 8, + "itār": 8, + "tāri": 8, + "срби": 8, + "рбиј": 8, + "nōr": 8, + "nton": 8, + "llan": 8, + "aban": 8, + "uera": 8, + "ntd": 8, + "5.t": 8, + "link": 8, + "a,s": 8, + "elar": 8, + "laru": 8, + "arus": 8, + "led": 8, + "ussi": 8, + "e30": 8, + "āni,": 8, + "e11": 8, + "rito": 8, + "rési": 8, + "raph": 8, + "ubli": 8, + "lati": 8, + "n,t": 8, + "),t": 8, + "’āfi": 8, + "roò": 8, + "o.i": 8, + "ierr": 8, + "utun": 8, + "is),": 8, + "ta(": 8, + "mere": 8, + "oliv": 8, + "anca": 8, + "rauh": 8, + "mā’o": 8, + "ā’oh": 8, + "onf": 8, + "nfl": 8, + "osse": 8, + "ava,": 8, + "popa": 8, + "aa(": 8, 
+ "eiah": 8, + "aamu": 8, + ",ho": 8, + "moor": 8, + "oore": 8, + "ipu": 8, + "vera": 8, + "toto": 8, + "ra1": 8, + "aef": 8, + "1ti": 8, + "pete": 8, + "a‘at": 8, + "anā": 8, + "a‘or": 8, + "issa": 8, + "teur": 8, + "atol": 8, + "mman": 8, + "a'at": 8, + "hiw": 8, + "ashi": 8, + "ingt": 8, + "ngto": 8, + "gton": 8, + "aof": 8, + "fth": 8, + "tate": 8, + "oa(": 8, + "tifi": 8, + "atap": 8, + "aop": 8, + "tine": 8, + "entr": 8, + "nohu": 8, + "enat": 8, + "a,r": 8, + ",ha": 8, + "are.": 8, + "faro": 8, + "ring": 8, + "raap": 8, + "nein": 8, + "aima": 8, + "uàò": 8, + "a,f": 8, + "kiwa": 8, + "ster": 8, + "ivav": 8, + "vaha": 8, + "atak": 8, + "faka": 8, + "ura,": 8, + "taka": 8, + "fang": 8, + "make": 8, + "oran": 8, + "aiar": 8, + "deo": 8, + "oro‘": 8, + "ïae": 8, + "aub": 8, + "au-m": 8, + "u-ma": 8, + "aaat": 8, + "êno": 8, + "berg": 8, + "lent": 8, + "tora": 8, + "toit": 8, + "oito": 8, + "ani.": 8, + "viiv": 8, + "iivi": 8, + "ivii": 8, + "fafa": 8, + "fata": 8, + "tiha": 8, + "anm": 8, + "toli": 8, + "bala": 8, + "hew": 8, + "arum": 8, + "graf": 8, + "doua": 8, + "ouar": 8, + "ōhip": 8, + "-per": 8, + "otur": 8, + "a-ma": 8, + "citr": 8, + "iati": 8, + "rina": 8, + "uise": 8, + "ifer": 8, + "gae": 8, + "biac": 8, + "e.v": 8, + "us),": 8, + "iber": 8, + "erac": 8, + "m²m": 8, + "²ma": 8, + "inan": 8, + "waia": 8, + "arte": 8, + "paul": 8, + "iaj": 8, + "turo": 8, + "ecr": 8, + "rasi": 8, + "mihi": 8, + "hill": 8, + "nbur": 8, + "uric": 8, + "npe": 8, + "hame": 8, + "nuf": 8, + "mēp": 8, + "davi": 8, + "avid": 8, + "edin": 8, + "etio": 8, + "thon": 8, + "otor": 8, + "ifr": 8, + "tuni": 8, + "sang": 8, + "e22": 8, + "ászt": 8, + "áres": 8, + "rote": 8, + "a.\"": 8, + "esse": 8, + "adag": 8, + "daga": 8, + "riri": 8, + "paea": 8, + "ukap": 8, + "mā2": 8, + "3te": 8, + "kaiw": 8, + "keta": 8, + "hapo": 8, + "maa,": 8, + "katu": 8, + "hek": 8, + "cien": 8, + "auah": 8, + "tai-": 8, + "l,i": 8, + "atoe": 8, + ",ke": 8, + "to'i": 8, + "9ua": 8, + ".23": 8, + ".24": 
8, + "e;e": 8, + "raah": 8, + "enos": 8, + "i;p": 8, + "faau": 8, + "rooh": 8, + "oohi": 8, + "toa-": 8, + "ala,": 8, + "ghu": 8, + "ene'": 8, + "ne'i": 8, + "re'a": 8, + "atil": 8, + "tild": 8, + "hann": 8, + "utuu": 8, + "tuut": 8, + "uutu": 8, + "cra.": 8, + "rusi": 8, + "oadu": 8, + "adu-": 8, + "du-g": 8, + "u-gy": 8, + "-gya": 8, + "gyem": 8, + "yema": 8, + "uor,": 8, + "dà": 7, + "s'": 7, + "tí": 7, + "tb": 7, + "p.": 7, + ".9": 7, + "tw": 7, + "lé": 7, + "69": 7, + "34": 7, + "4,": 7, + "».": 7, + "је": 7, + "ê,": 7, + "à,": 7, + "xf": 7, + "dg": 7, + "51": 7, + "7.": 7, + "m,": 7, + "cé": 7, + "àr": 7, + "bé": 7, + "nī": 7, + "éa": 7, + "‘n": 7, + "nū": 7, + "32": 7, + "70": 7, + "k=": 7, + "k.": 7, + "44": 7, + ",2": 7, + "/": 7, + "bb": 7, + "sw": 7, + "kl": 7, + "hd": 7, + "á.": 7, + ".,": 7, + "kū": 7, + "īs": 7, + "'ō": 7, + "oʻ": 7, + "’‘": 7, + "dc": 7, + "'em": 7, + "sad": 7, + "heu": 7, + "fon": 7, + "-sa": 7, + "lav": 7, + "umb": 7, + "ull": 7, + "agu": 7, + "arn": 7, + "esp": 7, + "nqu": 7, + "erd": 7, + "uga": 7, + "i).": 7, + "a-r": 7, + "pûr": 7, + "ûra": 7, + "hu‘": 7, + "heh": 7, + "wit": 7, + "ōtī": 7, + "eog": 7, + "ије": 7, + "raj": 7, + "aje": 7, + "mac": 7, + "rta": 7, + "mul": 7, + "ney": 7, + "app": 7, + "ppe": 7, + "'oa": 7, + "rst": 7, + "lea": 7, + "hō'": 7, + "ō'ē": 7, + "tj": 7, + "pip": 7, + "ke,": 7, + "ui,": 7, + "nu,": 7, + "ie,": 7, + "nk=": 7, + "āme": 7, + "orū": 7, + "o'e": 7, + "vis": 7, + "nsk": 7, + ",b": 7, + "ā'o": 7, + "'oi": 7, + "tiq": 7, + "uil": 7, + "tob": 7, + "pub": 7, + "ism": 7, + "âva": 7, + "oky": 7, + "(co": 7, + "sei": 7, + "kij": 7, + "arp": 7, + "rez": 7, + "nho": 7, + "pis": 7, + "uci": 7, + "cil": 7, + "bos": 7, + "itt": 7, + "ntu": 7, + "gib": 7, + "e),": 7, + "gau": 7, + "uch": 7, + "|te": 7, + "ea)": 7, + "vaè": 7, + "l(": 7, + "emm": 7, + "’ōp": 7, + "urs": 7, + "yg": 7, + "hee": 7, + "bab": 7, + "tsk": 7, + "db": 7, + "toè": 7, + "ei)": 7, + "ulo": 7, + "rno": 7, + "uth": 7, + "och": 7, + 
"iza": 7, + "kel": 7, + "to)": 7, + "hom": 7, + "uck": 7, + "se.": 7, + "hu,": 7, + "dir": 7, + "²t": 7, + "gog": 7, + "ogo": 7, + "urt": 7, + "spa": 7, + "ibi": 7, + "tle": 7, + "u’a": 7, + "lae": 7, + "yll": 7, + "o’o": 7, + "aèr": 7, + "nuu": 7, + "ūi": 7, + "ai’": 7, + "moi": 7, + "\"i": 7, + "àn": 7, + "ai'": 7, + ".è": 7, + "rof": 7, + "mā‘": 7, + "dea": 7, + "tuv": 7, + "gan": 7, + "-nu": 7, + "i-t": 7, + "te-": 7, + "ao.": 7, + "iāt": 7, + "ue.": 7, + "‘na": 7, + "āpū": 7, + "erm": 7, + "erv": 7, + "au‘": 7, + "cte": 7, + "ou‘": 7, + "nià": 7, + "ha'": 7, + "a-a": 7, + "’ao": 7, + "sla": 7, + "-ta": 7, + "ark": 7, + "uiu": 7, + "iui": 7, + "amâ": 7, + "mâr": 7, + "êu": 7, + "omb": 7, + "ith": 7, + "oxf": 7, + "xfo": 7, + "dge": 7, + "ii-": 7, + "ska": 7, + "ogi": 7, + "uon": 7, + "ui.": 7, + "‘ōh": 7, + "owe": 7, + "v1": 7, + "a6": 7, + "v2": 7, + "hns": 7, + "tōm": 7, + "ōmi": 7, + "yat": 7, + "a7": 7, + "mk": 7, + "kao": 7, + "mom": 7, + "ebá": 7, + "bás": 7, + "szo": 7, + "lár": 7, + "kul": 7, + "veh": 7, + "yh": 7, + "tub": 7, + "100": 7, + "8u": 7, + "tuk": 7, + "kee": 7, + "bio": 7, + "mōr": 7, + "rīs": 7, + "īsi": 7, + ".ʻ": 7, + "si,": 7, + "an,": 7, + ".5": 7, + "1u": 7, + "5e": 7, + "0u": 7, + "2e": 7, + "a’‘": 7, + "’‘e": 7, + "oda": 7, + "ʻor": 7, + "ya,": 7, + "aid": 7, + "le-": 7, + "e-b": 7, + "-bu": 7, + "nkw": 7, + "aky": 7, + "siw": 7, + "gok": 7, + "jat": 7, + "nba": 7, + "iàt": 7, + "iad": 7, + "rade": 7, + "lada": 7, + "afan": 7, + "onel": 7, + "itie": 7, + "empo": 7, + "mpor": 7, + "oa-h": 7, + "onm": 7, + "ita'": 7, + "au'": 7, + "retā": 7, + "etān": 7, + "nesi": 7, + "hō'ē": 7, + "aes": 7, + "reda": 7, + "ssan": 7, + "’oo": 7, + "pane": 7, + "onta": 7, + "ferr": 7, + "anya": 7, + "dàt": 7, + "tma": 7, + "oane": 7, + "braz": 7, + "razi": 7, + "azil": 7, + "zil.": 7, + "ntat": 7, + "sité": 7, + "ift": 7, + "tel.": 7, + "semi": 7, + "emit": 7, + "mita": 7, + "to‘a": 7, + "ahon": 7, + "pûra": 7, + "ûraa": 7, + "‘ii": 7, + "i-fa": 7, + 
"fa‘i": 7, + "ira.": 7, + "ona,": 7, + "afau": 7, + ",oi": 7, + "hu‘a": 7, + "arae": 7, + "‘ae": 7, + "ni(": 7, + "pōtī": 7, + "ōtīt": 7, + "eogr": 7, + "sand": 7, + "бије": 7, + "'emp": 7, + "omer": 7, + "ogu": 7, + "ramo": 7, + "oliu": 7, + "lius": 7, + "nque": 7, + "olle": 7, + "imen": 7, + "oren": 7, + "1.t": 7, + "4.t": 7, + "ink=": 7, + "insk": 7, + "e.m": 7, + "omin": 7, + "ssie": 7, + "30n": 7, + "nōa": 7, + "iero": 7, + "rorū": 7, + "orūt": 7, + "aik": 7, + "mā'o": 7, + "’a’a": 7, + "māf": 7, + "tist": 7, + "tiqu": 7, + "6ta": 7, + "publ": 7, + "npo": 7, + "tipe": 7, + "alex": 7, + "ìpa": 7, + "urev": 7, + "s.e": 7, + "-mar": 7, + "ntin": 7, + "tiet": 7, + "patr": 7, + "ista": 7, + "more": 7, + "alen": 7, + "live": 7, + "blan": 7, + "alme": 7, + "eida": 7, + "lian": 7, + "esm": 7, + "ora’": 7, + "’et": 7, + "flos": 7, + "loss": 7, + "auò": 7, + "tea,": 7, + "emar": 7, + "aèra": 7, + "èraa": 7, + "māra": 7, + "inir": 7, + "maoh": 7, + "hāmo": 7, + "āmoa": 7, + "naa.": 7, + "ua'a": 7, + "taio": 7, + "tona": 7, + "erah": 7, + "poe": 7, + "emai": 7, + "etm": 7, + "m²t": 7, + "auir": 7, + "anie": 7, + "otar": 7, + "eāt": 7, + "oàn": 7, + "terā": 7, + ";te": 7, + "anum": 7, + "tea.": 7, + "iria": 7, + "tito": 7, + "avan": 7, + "aron": 7, + "ne2": 7, + "ietu": 7, + "reia": 7, + "āap": 7, + "iene": 7, + "enp": 7, + "oem": 7, + "te(": 7, + "over": 7, + "nite": 7, + "ecto": 7, + "tory": 7, + "tuva": 7, + "iāte": 7, + "u,u": 7, + "‘aa": 7, + "êha": 7, + "a(n": 7, + "e16": 7, + ",pa": 7, + "eaf": 7, + "sete": 7, + "ma‘i": 7, + "i,n": 7, + "asia": 7, + "hia,": 7, + "au‘a": 7, + "‘in": 7, + "mou‘": 7, + "ou‘a": 7, + "paìr": 7, + "5ti": 7, + ":ma": 7, + "ara,": 7, + "apu,": 7, + "eti’": 7, + "òtu": 7, + "earo": 7, + "eran": 7, + "cata": 7, + "eita": 7, + "ori.": 7, + "ta'a": 7, + "naru": 7, + "cque": 7, + "chir": 7, + "e29": 7, + "nico": 7, + "icol": 7, + "ònu": 7, + "tuan": 7, + "oto,": 7, + "ahun": 7, + "tung": 7, + "utav": 7, + "uiui": 7, + "eev": 7, + "sala": 7, + 
"aror": 7, + "e25": 7, + "ando": 7, + "i,a": 7, + "oxfo": 7, + "xfor": 7, + "faur": 7, + "atop": 7, + "rii-": 7, + "i-ra": 7, + "rare": 7, + "soti": 7, + "ïan": 7, + "rau,": 7, + "noto": 7, + "medi": 7, + "uman": 7, + "tric": 7, + "iàp": 7, + "àpō": 7, + "iane": 7, + "edou": 7, + "rdf": 7, + "dfr": 7, + "ritc": 7, + "a’ap": 7, + "’ae": 7, + "pira": 7, + "‘ōhi": 7, + "u,n": 7, + "ahot": 7, + "well": 7, + "rair": 7, + "inda": 7, + "ophy": 7, + "phyl": 7, + "hyll": 7, + "nsis": 7, + "ufi": 7, + "roli": 7, + "trus": 7, + "inen": 7, + "rant": 7, + "mang": 7, + "rubi": 7, + "kiri": 7, + "gauc": 7, + "kong": 7, + "tace": 7, + "euf": 7, + "ezi": 7, + "zing": 7, + "ngib": 7, + "gibe": 7, + "anno": 7, + "nnon": 7, + "nona": 7, + "an-r": 7, + "n-ra": 7, + "king": 7, + "eima": 7, + "aian": 7, + "inia": 7, + "ical": 7, + "erto": 7, + "yma": 7, + "dani": 7, + "vare": 7, + "rela": 7, + "acl": 7, + "unes": 7, + "asil": 7, + "essi": 7, + "n,e": 7, + "ream": 7, + "mauh": 7, + "atum": 7, + "nger": 7, + "prin": 7, + "shan": 7, + "dela": 7, + "01n": 7, + "llah": 7, + "hali": 7, + "asca": 7, + "ohns": 7, + "uaj": 7, + "tōmi": 7, + "uim": 7, + "8ti": 7, + "opoa": 7, + "sebá": 7, + "ebás": 7, + "bász": 7, + ",ki": 7, + "r,i": 7, + "inai": 7, + "dinb": 7, + "inbu": 7, + "urgh": 7, + "ikan": 7, + "6te": 7, + "7te": 7, + "8ua": 7, + "ngai": 7, + "koe": 7, + ".ka": 7, + "nong": 7, + "a;i": 7, + "akiw": 7, + "0ng": 7, + "ahae": 7, + "taak": 7, + "uui": 7, + "aihi": 7, + "anaw": 7, + "e'ā": 7, + "ara'": 7, + "omō": 7, + "mōrī": 7, + "ōrīs": 7, + "rīsi": 7, + "īsia": 7, + "e'ar": 7, + ".ʻo": 7, + "a.4": 7, + "a.8": 7, + ".10": 7, + "1ua": 7, + ".14": 7, + ".16": 7, + ".17": 7, + "0ua": 7, + ".22": 7, + "uaô": 7, + "u.1": 7, + ".15": 7, + "e.1": 7, + ".18": 7, + "’ui": 7, + "a’‘e": 7, + "uput": 7, + "etus": 7, + "seta": 7, + "vaï": 7, + "ema,": 7, + "putu": 7, + "aaue": 7, + "-ato": 7, + "faaf": 7, + "nya.": 7, + "ʻora": 7, + "iror": 7, + "arê": 7, + "anad": 7, + "a'or": 7, + "toer": 7, + "u'ah": 
7, + "ahu'": 7, + "susa": 7, + "usan": 7, + "oof": 7, + "rle-": 7, + "le-b": 7, + "e-bu": 7, + "kufo": 7, + "issi": 7, + "goka": 7, + "resa": 7, + "alij": 7, + "lija": 7, + "ijat": 7, + "jata": 7, + "unis": 7, + "'h": 6, + "vu": 6, + "ós": 6, + "aq": 6, + "93": 6, + "nj": 6, + "a?": 6, + "fé": 6, + "ém": 6, + "96": 6, + "/k": 6, + "43": 6, + "tn": 6, + "aā": 6, + "ww": 6, + "w.": 6, + "ôr": 6, + "já": 6, + "0.": 6, + "33": 6, + "ço": 6, + "’ī": 6, + "āo": 6, + "rō": 6, + "âa": 6, + "f)": 6, + "v.": 6, + "ég": 6, + "mé": 6, + "bs": 6, + "3,": 6, + "ôo": 6, + "ūm": 6, + "ùo": 6, + "87": 6, + "ís": 6, + "38": 6, + "71": 6, + "k,": 6, + ".0": 6, + "06": 6, + "5,": 6, + ",6": 6, + "a‎": 6, + "yr": 6, + "gg": 6, + "hs": 6, + "bh": 6, + "gb": 6, + "y-": 6, + "j,": 6, + "tz": 6, + "tô": 6, + "ī’": 6, + "hf": 6, + "gā": 6, + "\"h": 6, + "ǎr": 6, + "rô": 6, + "ê.": 6, + "ǒ": 6, + "s\"": 6, + "%": 6, + "rdà": 6, + "lls": 6, + "urn": 6, + "ual": 6, + "lta": 6, + "sat": 6, + "fel": 6, + "ols": 6, + "rug": 6, + "cla": 6, + "nyo": 6, + "yon": 6, + "rtí": 6, + "abr": 6, + "cli": 6, + "bes": 6, + "ése": 6, + "a/k": 6, + "l.:": 6, + "u-r": 6, + "aft": 6, + "300": 6, + "ae’": 6, + "’ne": 6, + "oga": 6, + "sau": 6, + "lab": 6, + ",l": 6, + "in,": 6, + "avo": 6, + "how": 6, + "ruu": 6, + "lez": 6, + "hp": 6, + "thr": 6, + "fou": 6, + "sev": 6, + "uny": 6, + "yol": 6, + "via": 6, + "tos": 6, + "joa": 6, + "nts": 6, + "loc": 6, + "ets": 6, + "auk": 6, + "go,": 6, + "vak": 6, + "mek": 6, + "gie": 6, + "nīt": 6, + "īti": 6, + "idi": 6, + "200": 6, + ",’": 6, + "abl": 6, + "niv": 6, + "aux": 6, + "pul": 6, + ":6": 6, + "īri": 6, + "6k": 6, + "sme": 6, + "l-s": 6, + "exa": 6, + "sua": 6, + "nid": 6, + "ido": 6, + "nço": 6, + "çoi": 6, + "4o": 6, + "lec": 6, + "utr": 6, + "òs": 6, + "bay": 6, + "rpu": 6, + "lti": 6, + "pec": 6, + "dos": 6, + "sod": 6, + "nci": 6, + "cio": 6, + "uja": 6, + "abo": 6, + "adr": 6, + "fia": 6, + "uza": 6, + "gun": 6, + "(am": 6, + "izo": 6, + "(mu": 6, + "vān": 6, 
+ "hid": 6, + "(ca": 6, + "gif": 6, + "mān": 6, + "lne": 6, + "wil": 6, + "bak": 6, + "yev": 6, + "ibo": 6, + "wal": 6, + "sne": 6, + "r:": 6, + "n-m": 6, + "inf": 6, + "vec": 6, + "ère": 6, + "ed.": 6, + "rgi": 6, + "gio": 6, + "leg": 6, + "naj": 6, + "gin": 6, + "gus": 6, + "kak": 6, + "old": 6, + "sg": 6, + "rva": 6, + "alc": 6, + "osé": 6, + "ath": 6, + "een": 6, + "rda": 6, + "tōt": 6, + "sop": 6, + "aʻa": 6, + "lib": 6, + "māo": 6, + "āor": 6, + "•t": 6, + "vīt": 6, + ")a": 6, + "eià": 6, + "rār": 6, + "muh": 6, + "èi": 6, + "ouv": 6, + "nme": 6, + "anq": 6, + "cd": 6, + "(mo": 6, + "‘a,": 6, + "ūo": 6, + "tūk": 6, + "2k": 6, + "cp": 6, + ":\"": 6, + "ôoà": 6, + ":-": 6, + "huà": 6, + "isl": 6, + "na:": 6, + "erl": 6, + "rko": 6, + "mbi": 6, + "oï": 6, + "ii.": 6, + "âra": 6, + "eaè": 6, + "idg": 6, + "eê": 6, + "vev": 6, + "iï": 6, + "ōno": 6, + "er.": 6, + "āpi": 6, + "āru": 6, + "mid": 6, + "ziz": 6, + "k1": 6, + "nri": 6, + "erb": 6, + "bah": 6, + "nik": 6, + "kos": 6, + "nku": 6, + "ivo": 6, + "nny": 6, + "afu": 6, + "g2": 6, + "kol": 6, + "lay": 6, + "ouf": 6, + "u2": 6, + "nsa": 6, + "ztá": 6, + "csk": 6, + "zop": 6, + "ány": 6, + "zte": 6, + "csá": 6, + "kus": 6, + "le,": 6, + "la.": 6, + "elu": 6, + "pu-": 6, + ":h": 6, + "ko.": 6, + "ngā": 6, + "oi,": 6, + "al,": 6, + "lyd": 6, + "ock": 6, + "'ār": 6, + "rāh": 6, + "'āp": 6, + "ō'o": 6, + "'ur": 6, + ";f": 6, + "pe,": 6, + "7u": 6, + "mǎr": 6, + ";h": 6, + "mu,": 6, + "ei:": 6, + "uua": 6, + "phd": 6, + "ǔn": 6, + "nkr": 6, + "ahl": 6, + "hle": 6, + "\"u": 6, + "kof": 6, + "allo": 6, + "nia,": 6, + "'ape": 6, + "quel": 6, + "gaia": 6, + "ad'": 6, + "tall": 6, + "ilan": 6, + "lana": 6, + "alle": 6, + "ober": 6, + "ratā": 6, + "atān": 6, + "rain": 6, + "ropu": 6, + "stt": 6, + "onn": 6, + "than": 6, + "uruu": 6, + "ruur": 6, + "uuru": 6, + "uie": 6, + "parl": 6, + "host": 6, + "ntf": 6, + "deb": 6, + "ntj": 6, + "ines": 6, + "ocar": 6, + "artí": 6, + "gte": 6, + "sho": 6, + "i(m": 6, + "ibr": 6, + 
".pr": 6, + "rése": 6, + "ésen": 6, + "el.:": 6, + "‘im": 6, + "a-ra": 6, + "erik": 6, + "i‘a-": 6, + "hona": 6, + "apûr": 6, + "‘if": 6, + "teat": 6, + "ahu‘": 6, + "hehe": 6, + "eheu": 6, + "ared": 6, + "haro": 6, + "nura": 6, + "’itā": 6, + "ūnō": 6, + "ōre": 6, + "’nei": 6, + "erse": 6, + "bell": 6, + "d'em": 6, + "pord": 6, + "ordà": 6, + "lome": 6, + "el'": 6, + "ded": 6, + "humb": 6, + "amor": 6, + "llt": 6, + "rmen": 6, + "’od": 6, + "olla": 6, + "arac": 6, + "llet": 6, + "’on": 6, + "aver": 6, + "6.t": 6, + "8.t": 6, + "ti4": 6, + "0.t": 6, + "2.t": 6, + "9.t": 6, + "ti6": 6, + "7.t": 6, + "3.t": 6, + "mins": 6, + "s.u": 6, + "iver": 6, + "uso": 6, + "bara": 6, + "e17": 6, + "rici": 6, + "31t": 6, + "ai(": 6, + "’a(": 6, + "sili": 6, + "grap": 6, + "atis": 6, + "stiq": 6, + "esti": 6, + "ions": 6, + "1ta": 6, + "erre": 6, + "refe": 6, + "efer": 6, + "fere": 6, + "tīri": 6, + "viti": 6, + "itip": 6, + "’ari": 6, + "’api": 6, + "ifit": 6, + "lexa": 6, + "exan": 6, + "xand": 6, + "anço": 6, + "nçoi": 6, + "çois": 6, + "n,i": 6, + "part": 6, + "nure": 6, + "ngel": 6, + "int-": 6, + "ngh": 6, + "viet": 6, + "etie": 6, + ").u": 6, + "cet": 6, + "ieti": 6, + "smo": 6, + "piso": 6, + "ngue": 6, + "cess": 6, + "lmei": 6, + "meid": 6, + "iep": 6, + "\".t": 6, + "e23": 6, + "aiu": 6, + "osca": 6, + "rete": 6, + "eòh": 6, + "otō": 6, + "efā": 6, + "rāto": 6, + "nīti": 6, + "ītia": 6, + "māor": 6, + "āori": 6, + "vītī": 6, + "tou.": 6, + "tepo": 6, + "hau.": 6, + "tāpa": 6, + "uati": 6, + "tāma": 6, + "evā": 6, + "tmt": 6, + "àno": 6, + "rāri": 6, + "90t": 6, + "ai'a": 6, + "i'ao": 6, + "oto.": 6, + "une,": 6, + "eâv": 6, + "âvaè": 6, + "u,m": 6, + "aaê": 6, + "roro": 6, + "amue": 6, + "2ti": 6, + "hepe": 6, + "itet": 6, + "erne": 6, + "elh": 6, + "cher": 6, + ":ta": 6, + "emma": 6, + "ante": 6, + "wash": 6, + "whit": 6, + "epr": 6, + "ited": 6, + "ates": 6, + "egor": 6, + "’ie": 6, + "anqu": 6, + "o’or": 6, + "ea),": 6, + "-nui": 6, + "ore‘": 6, + "ai‘a": 6, + "pūo": 
6, + "‘oi": 6, + "ta‘u": 6, + "arue": 6, + "ilom": 6, + "pāpū": 6, + "otū": 6, + "tūka": 6, + "avar": 6, + "a,p": 6, + "erei": 6, + "hia.": 6, + "a‘am": 6, + "atoi": 6, + "‘ui": 6, + "onar": 6, + "h,t": 6, + "angu": 6, + "ctio": 6, + "omat": 6, + "ôra": 6, + "otu.": 6, + "hure": 6, + "iup": 6, + "ahuà": 6, + "eài": 6, + "tuai": 6, + "upit": 6, + "ēmo": 6, + "heti": 6, + "orap": 6, + "rapo": 6, + "isla": 6, + "gene": 6, + "nera": 6, + "lita": 6, + "esta": 6, + "owh": 6, + ".me": 6, + "ttar": 6, + "arel": 6, + "rell": 6, + "i,1": 6, + "roa.": 6, + "tenu": 6, + "anov": 6, + "òha": 6, + "napu": 6, + "òan": 6, + "urun": 6, + "pata": 6, + "ika,": 6, + "uana": 6, + "ake,": 6, + "utea": 6, + "òni": 6, + "òre": 6, + "koto": 6, + "emat": 6, + "papu": 6, + "tuet": 6, + "aini": 6, + "atit": 6, + "’na.": 6, + "auiu": 6, + "oïa": 6, + "eta,": 6, + "ipar": 6, + "rii.": 6, + "amâr": 6, + "mâra": 6, + "âraa": 6, + "râo": 6, + "ta1": 6, + "ilia": 6, + "oêu": 6, + "e,a": 6, + "utar": 6, + "eaèr": 6, + "eal": 6, + "a,v": 6, + "rden": 6, + "goe": 6, + "ògr": 6, + "ême": 6, + "oih": 6, + "erea": 6, + "(mus": 6, + "hamm": 6, + "uab": 6, + "aham": 6, + "opan": 6, + "ridg": 6, + "idge": 6, + "veve": 6, + "iïa": 6, + "urir": 6, + "i20": 6, + "i23": 6, + "apan": 6, + "tōno": 6, + "ōnot": 6, + "arad": 6, + "isia": 6, + "atri": 6, + "uche": 6, + "ā.ò": 6, + "teva": 6, + "huta": 6, + "aro.": 6, + "hant": 6, + "taip": 6, + "uiha": 6, + "isto": 6, + "albe": 6, + "raiv": 6, + "upua": 6, + "puai": 6, + "i.è": 6, + ".èn": 6, + "yllu": 6, + "ndan": 6, + "anus": 6, + "ntho": 6, + "haru": 6, + "itru": 6, + "ia),": 6, + "ubia": 6, + "i(c": 6, + "i.k": 6, + "anac": 6, + "tez": 6, + "e’ō": 6, + "card": 6, + "marc": 6, + "hani": 6, + "iner": 6, + "elen": 6, + "ihi.": 6, + "edua": 6, + "duar": 6, + "nita": 6, + "seba": 6, + "mand": 6, + "elin": 6, + "rona": 6, + "rari": 6, + "oeu": 6, + "kari": 6, + "josé": 6, + "eym": 6, + "i(t": 6, + "t,i": 6, + "sour": 6, + "roon": 6, + "iic": 6, + "cec": 6, + "crea": 6, 
+ "raia": 6, + "eab": 6, + "a(a": 6, + "llin": 6, + "bola": 6, + "neta": 6, + "ni2": 6, + "iea": 6, + "enri": 6, + "a12": 6, + "7ti": 6, + "auti": 6, + "ii6": 6, + "anp": 6, + "amed": 6, + "alif": 6, + "lifa": 6, + "wang": 6, + "puru": 6, + "on1": 6, + "ong-": 6, + "ruk": 6, + "inis": 6, + "nist": 6, + "kata": 6, + "22t": 6, + "bach": 6, + "alal": 6, + "15t": 6, + "tag": 6, + "apri": 6, + "slei": 6, + "leim": 6, + "hnso": 6, + "kait": 6, + "henr": 6, + "hnk": 6, + "19n": 6, + "nuh": 6, + "bron": 6, + "came": 6, + "aoo": 6, + "eone": 6, + "biss": 6, + "sztá": 6, + "resz": 6, + "szop": 6, + "oszt": 6, + "szte": 6, + "láre": 6, + "iszt": 6, + "te7": 6, + "ien,": 6, + "agog": 6, + "geri": 6, + "rapu": 6, + "apu-": 6, + "2te": 6, + "rok": 6, + "aiwh": 6, + "iwha": 6, + "kaak": 6, + "aako": 6, + "ako.": 6, + "waah": 6, + "hake": 6, + "aroh": 6, + "erek": 6, + "awar": 6, + "oru.": 6, + ",ku": 6, + "momo": 6, + "akor": 6, + "u.m": 6, + "awan": 6, + "onon": 6, + "ssoc": 6, + "ciat": 6, + ",in": 6, + "irim": 6, + "y,i": 6, + "rero": 6, + "a,2": 6, + "i,k": 6, + "apai": 6, + "haki": 6, + "rock": 6, + "gasc": 6, + "otte": 6, + "gara": 6, + "logy": 6, + "ā'oh": 6, + "rāhi": 6, + "'ea": 6, + "'ef": 6, + "'ait": 6, + "ra'i": 6, + "aoto": 6, + "'aho": 6, + "'ura": 6, + "'atu": 6, + "taai": 6, + "aair": 6, + ";fa": 6, + "a.6": 6, + "ape,": 6, + "a.7": 6, + "7ua": 6, + "a.9": 6, + "nua;": 6, + "ero,": 6, + ".12": 6, + "18e": 6, + "19e": 6, + ".25": 6, + "nuo": 6, + "e.2": 6, + ";ei": 6, + "eden": 6, + "dene": 6, + "a;o": 6, + "ïao": 6, + "amu,": 6, + "o’u": 6, + "hopo": 6, + "opoi": 6, + "nei:": 6, + "ima,": 6, + "ela,": 6, + "taih": 6, + "nosa": 6, + "êa‘": 6, + "êah": 6, + "sela": 6, + "êor": 6, + "pǔn": 6, + "rose": 6, + "mary": 6, + "usn": 6, + "nada": 6, + "sahl": 6, + "ahle": 6, + "wesl": 6, + "cra,": 6, + "empa": 6, + "hess": 6, + "gyek": 6, + "yei": 6, + "man-": 6, + "-raw": 6, + "olik": 6, + "là": 5, + "pm": 5, + "pt": 5, + ",8": 5, + "80": 5, + "é:": 5, + ",9": 5, + "+5": 
5, + "1)": 5, + "pf": 5, + "ē,": 5, + "ī,": 5, + "р": 5, + "на": 5, + "и": 5, + "1:": 5, + "g.": 5, + "ée": 5, + "rh": 5, + "37": 5, + "ūʻ": 5, + "v,": 5, + "<": 5, + "76": 5, + "àu": 5, + "°c": 5, + "ét": 5, + "éo": 5, + "(u": 5, + "u)": 5, + "ws": 5, + "'é": 5, + "66": 5, + "-i": 5, + "-v": 5, + "o\"": 5, + "75": 5, + "pé": 5, + "àe": 5, + "72": 5, + "-w": 5, + "zy": 5, + "36": 5, + "68": 5, + "79": 5, + "88": 5, + "47": 5, + "04": 5, + "°": 5, + "r)": 5, + ",7": 5, + "ïd": 5, + "âm": 5, + "-u": 5, + "dl": 5, + "dm": 5, + "á,": 5, + "pk": 5, + "ác": 5, + "):": 5, + "×": 5, + "|g": 5, + "»,": 5, + "–": 5, + "kī": 5, + "": 2, + "aude": 2, + "ssin": 2, + "sini": 2, + "cens": 2, + "ense": 2, + "erj": 2, + "janv": 2, + "anvi": 2, + "nvie": 2, + "emie": 2, + "emps": 2, + "usv": 2, + "erro": 2, + "rons": 2, + "nsq": 2, + "tco": 2, + ",et": 2, + "fini": 2, + "iil": 2, + "lse": 2, + "sert": 2, + "ent,": 2, + ",il": 2, + "d'u": 2, + "d'un": 2, + "uns": 2, + "meu": 2, + "ol,": 2, + "tent": 2, + "sole": 2, + "olei": 2, + "leil": 2, + "shir": 2, + "qu'": 2, + "qu'i": 2, + "u'il": 2, + "iln": 2, + "livi": 2, + "ivie": 2, + "ives": 2, + "djo": 2, + "k.m": 2, + "guil": 2, + "uila": 2, + "a:6": 2, + "090": 2, + "3)t": 2, + "nath": 2, + "thor": 2, + "horn": 2, + "uang": 2, + "oong": 2, + "ongr": 2, + "itic": 2, + "ē,f": 2, + "wie": 2, + "wien": 2, + "icio": 2, + "ious": 2, + "bask": 2, + "aski": 2, + "skin": 2, + "robb": 2, + "obbi": 2, + "bbin": 2, + "bins": 2, + "nchi": 2, + "30f": 2, + "merg": 2, + "rger": 2, + "amv": 2, + "mve": 2, + "ntur": 2, + "tba": 2, + "ns,": 2, + "mfa": 2, + "snow": 2, + "nowb": 2, + "owbi": 2, + "wbir": 2, + "bird": 2, + "rdp": 2, + "dpa": 2, + "flav": 2, + "uruh": 2, + "eib": 2, + "sler": 2, + "panu": 2, + "ulac": 2, + "īpan": 2, + "ria)": 2, + "(cor": 2, + "lus)": 2, + "tchi": 2, + "apin": 2, + "ndac": 2, + "aceu": 2, + "ceum": 2, + "e(h": 2, + "(hi": 2, + "(hib": 2, + "ibis": 2, + "bisc": 2, + "scus": 2, + "rēmu": 2, + "ēmun": 2, + "muna": 2, + 
"cag": 2, + "ythr": 2, + "attl": 2, + "ttle": 2, + "emy": 2, + "myr": 2, + "myrt": 2, + "yrta": 2, + "rtac": 2, + "u(c": 2, + "e’ī": 2, + "’ī’": 2, + "’ī’ī": 2, + "ī’īt": 2, + "’ītā": 2, + "ītā": 2, + "tā(": 2, + "cari": 2, + "aric": 2, + "icac": 2, + "ua’a": 2, + "icul": 2, + "cula": 2, + "urep": 2, + "epur": 2, + "(alp": 2, + "alpi": 2, + "lpin": 2, + "pini": 2, + "a’ur": 2, + "’ura": 2, + "gera": 2, + "hi’": 2, + "’ute": 2, + "urat": 2, + "smin": 2, + "inum": 2, + "thri": 2, + "thur": 2, + "uriu": 2, + "uarā": 2, + "arāt": 2, + "rātā": 2, + "(me": 2, + "eros": 2, + "cult": 2, + "tiva": 2, + "spri": 2, + "(ch": 2, + "lico": 2, + "icon": 2, + "ambo": 2, + "pole": 2, + "e)a": 2, + "afet": 2, + "feta": 2, + "idk": 2, + "dka": 2, + "karz": 2, + "arza": 2, + "jaco": 2, + "acob": 2, + "obz": 2, + "bzu": 2, + "zum": 2, + "zuma": 2, + "ēar": 2, + "ujar": 2, + "izb": 2, + "zbo": 2, + "utef": 2, + "tefl": 2, + "efli": 2, + "flik": 2, + "lmal": 2, + "male": 2, + "kse": 2, + "sell": 2, + "llal": 2, + "joac": 2, + "oach": 2, + "mga": 2, + "auck": 2, + "merk": 2, + "erke": 2, + "rkel": 2, + "uif": 2, + "de1": 2, + "ui’": 2, + "’epi": 2, + "poj": 2, + "nric": 2, + "ubac": 2, + "dod": 2, + "os1": 2, + "bald": 2, + "-sao": 2, + "saou": 2, + "aoud": 2, + "dez": 2, + "r10": 2, + "auj": 2, + "gec": 2, + "ch2": 2, + "sarg": 2, + "args": 2, + "rgsi": 2, + "gsia": 2, + "’epe": 2, + "nbr": 2, + "utet": 2, + "baïd": 2, + "aïdj": 2, + "ïdja": 2, + "djan": 2, + "alie": 2, + "liev": 2, + "amas": 2, + "oulk": 2, + "edb": 2, + "dbe": 2, + "al-k": 2, + "l-kh": 2, + "-kha": 2, + "alma": 2, + "lman": 2, + "shp": 2, + "ulh": 2, + "chei": 2, + "asin": 2, + "ii3": 2, + "llio": 2, + "ve1": 2, + "ndel": 2, + "mab": 2, + "dean": 2, + "yay": 2, + "chen": 2, + "sher": 2, + "y30": 2, + "20f": 2, + "s22": 2, + "ić1": 2, + "slav": 2, + "inū": 2, + "ūnaa": 2, + "bots": 2, + "nkh": 2, + "kham": 2, + "a01": 2, + "rous": 2, + "anal": 2, + "bolk": 2, + "olki": 2, + "kiah": 2, + "ah1": 2, + "levn": 2, + "ev2": 
2, + "adol": 2, + "dolp": 2, + "olph": 2, + "lphe": 2, + "tiao": 2, + "ao1": 2, + "za2": 2, + "noro": 2, + "odom": 2, + "oms": 2, + "iham": 2, + "amon": 2, + "en1": 2, + "neé": 2, + "eél": 2, + "élis": 2, + "harp": 2, + "arpe": 2, + "sém": 2, + "éma": 2, + "eves": 2, + "netu": 2, + "tax": 2, + "axi": 2, + "lsa": 2, + "lilo": 2, + "n29": 2, + "un1": 2, + "n11": 2, + "pāru": 2, + "ārur": 2, + "am5": 2, + "ng-j": 2, + "oàp": 2, + "àpe": 2, + "on2": 2, + "n26": 2, + "lass": 2, + "lka": 2, + "ing-": 2, + "ader": 2, + "rka": 2, + "lmo": 2, + "ōmin": 2, + "mans": 2, + "anso": 2, + "04n": 2, + "haz": 2, + "ayed": 2, + "ahya": 2, + "mmed": 2, + "akto": 2, + "work": 2, + "iju": 2, + "rajo": 2, + "hend": 2, + "drik": 2, + "ilve": 2, + "mula": 2, + "aile": 2, + "dess": 2, + "īpe": 2, + "nail": 2, + "au3": 2, + "u30": 2, + "kba": 2, + "en2": 2, + "ayra": 2, + "ndon": 2, + "ma2": 2, + "tamo": 2, + "h22": 2, + "tiho": 2, + "iorg": 2, + "achv": 2, + "chvi": 2, + "hvil": 2, + "vili": 2, + "arib": 2, + "dram": 2, + "papo": 2, + "s12": 2, + "gren": 2, + "enad": 2, + "mitc": 2, + "otto": 2, + "ndé": 2, + "dfo": 2, + "madj": 2, + "idu": 2, + "ne-": 2, + "hind": 2, + "s11": 2, + "notu": 2, + "ktor": 2, + "abm": 2, + "mēî": 2, + "mban": 2, + "no2": 2, + "rāti": 2, + "ni7": 2, + "4ti": 2, + "irur": 2, + "enda": 2, + "kenn": 2, + "enny": 2, + "sson": 2, + "shim": 2, + "s15": 2, + "rico": 2, + "a28": 2, + "ilf": 2, + "kaz": 2, + "kaza": 2, + "zakh": 2, + "akhs": 2, + "khst": 2, + "hsta": 2, + "soul": 2, + "ltan": 2, + "baïe": 2, + "aïev": 2, + "meto": 2, + "uhur": 2, + "aldi": 2, + "g10": 2, + "ahja": 2, + "mth": 2, + "al-a": 2, + "l-ah": 2, + "-ahm": 2, + "ahma": 2, + "hmad": 2, + "al-j": 2, + "l-ja": 2, + "jabe": 2, + "-sab": 2, + "chou": 2, + "houm": 2, + "oumm": 2, + "umma": 2, + "mmal": 2, + "maly": 2, + "aly": 2, + "yaso": 2, + "sone": 2, + "ne8": 2, + "amma": 2, + "dris": 2, + "vski": 2, + "is1": 2, + "rīp": 2, + "naji": 2, + "ajib": 2, + "jib": 2, + "mika": 2, + "enj": 2, + "af1": 
2, + "algi": 2, + "kevi": 2, + "s13": 2, + "tiut": 2, + "v12": 2, + "evsk": 2, + "rbe": 2, + "msh": 2, + "shah": 2, + "amee": 2, + "n17": 2, + "y5": 2, + "enki": 2, + "k10": 2, + "ould": 2, + "dmo": 2, + "dla": 2, + "uep": 2, + "rota": 2, + "avia": 2, + "iuri": 2, + "urie": 2, + "lean": 2, + "a25": 2, + "roge": 2, + "oger": 2, + "hiag": 2, + "elbe": 2, + "kano": 2, + "arma": 2, + "nami": 2, + "amip": 2, + "mipi": 2, + "ipia": 2, + "yep": 2, + "hag": 2, + "eing": 2, + "baro": 2, + "v23": 2, + "lra": 2, + "ga1": 2, + "brig": 2, + "luck": 2, + "rym": 2, + "ae3": 2, + "aqa": 2, + "qab": 2, + "qabo": 2, + "usb": 2, + "ïd2": 2, + "kist": 2, + "yre": 2, + "anam": 2, + "inel": 2, + "will": 2, + "llem": 2, + "r30": 2, + "28t": 2, + "beni": 2, + "udo": 2, + "lth": 2, + "nass": 2, + "u20": 2, + "ta7": 2, + "dca": 2, + "mēr": 2, + "ne7": 2, + "game": 2, + "umur": 2, + "mure": 2, + "ntk": 2, + "tki": 2, + "doug": 2, + "ougl": 2, + "ugla": 2, + "nadi": 2, + "onsa": 2, + "rdon": 2, + "darc": 2, + "akao": 2, + "fun": 2, + "mase": 2, + "-pir": 2, + "into": 2, + "brie": 2, + "acky": 2, + "cky": 2, + "27t": 2, + "jame": 2, + "yta": 2, + "paro": 2, + "rtf": 2, + "o4": 2, + "k20": 2, + "dif": 2, + "hsh": 2, + "ūtān": 2, + "el-": 2, + "edri": 2, + "urin": 2, + "abas": 2, + "busi": 2, + "acha": 2, + "ssad": 2, + "oqi": 2, + "oqil": 2, + "ayi": 2, + "ying": 2, + "kaya": 2, + "izen": 2, + "déb": 2, + "byi": 2, + "zema": 2, + "uay": 2, + "axa": 2, + "ahoo": 2, + "vi1": 2, + "sses": 2, + "lara": 2, + "urba": 2, + "rban": 2, + "ngul": 2, + "muha": 2, + "uham": 2, + "seni": 2, + "il2": 2, + "nguy": 2, + "guyễ": 2, + "uyễn": 2, + "yễn": 2, + "tấn": 2, + "had": 2, + "dba": 2, + "time": 2, + "mmer": 2, + "vemb": 2, + "òna.": 2, + "عبد": 2, + "بدا": 2, + "دال": 2, + "],m": 2, + "teko": 2, + "ekok": 2, + "koko": 2, + "lod": 2, + "táp": 2, + "ská,": 2, + "ká,": 2, + "lác": 2, + "opká": 2, + "pkáv": 2, + "káve": 2, + "ávet": 2, + "vetr": 2, + "etrá": 2, + "ráe": 2, + "imán": 2, + "ászk": 2, + "szku": 
2, + "zkur": 2, + "nyá,": 2, + "yá,": 2, + "á,p": 2, + "áro": 2, + "opol": 2, + ".ki": 2, + "sebi": 2, + "isku": 2, + ",ná": 2, + "opki": 2, + "onst": 2, + "oszk": 2, + "szká": 2, + "e,c": 2, + "kále": 2, + "nyáz": 2, + "yáze": 2, + "nyis": 2, + "yisz": 2, + "iszk": 2, + "káá": 2, + "posz": 2, + "nyij": 2, + "i.r": 2, + ".ro": 2, + "szu": 2, + "szup": 2, + "nyev": 2, + "lesz": 2, + "sztr": 2, + "ztrá": 2, + "trát": 2, + "ráti": 2, + "oriz": 2, + "zány": 2, + "ányi": 2, + "disz": 2, + "ngit": 2, + "siku": 2, + "ikul": 2, + "gáre": 2, + "csin": 2, + "siny": 2, + "vnyi": 2, + "zki": 2, + "otri": 2, + "ivál": 2, + "vále": 2, + "szim": 2, + "csik": 2, + "szto": 2, + "lo.": 2, + "ropp": 2, + "lder": 2, + "skum": 2, + ",gr": 2, + "rány": 2, + "kij,": 2, + "ztá.": 2, + "tá.": 2, + "ilá": 2, + "dzsá": 2, + "proz": 2, + "zeny": 2, + "evol": 2, + "nkul": 2, + "e.l": 2, + "orio": 2, + "ole,": 2, + "vitr": 2, + "itre": 2, + "csim": 2, + "lics": 2, + "slá": 2, + "zed": 2, + "szl": 2, + "inye": 2, + "nyen": 2, + "yenk": 2, + "linn": 2, + "pper": 2, + "rvin": 2, + "ije": 2, + "dest": 2, + "omen": 2, + "szd": 2, + "ler,": 2, + "r,d": 2, + "itro": 2, + "trom": 2, + "ijs": 2, + "evá": 2, + "nyás": 2, + "yász": 2, + "szki": 2, + "zkij": 2, + "etri": 2, + "elá": 2, + "ácse": 2, + "yde": 2, + "detr": 2, + "ripo": 2, + ".li": 2, + "egas": 2, + "a:5": 2, + "e:3": 2, + "352": 2, + "52k": 2, + "2km": 2, + "40t": 2, + ":55": 2, + "elas": 2, + "enho": 2, + "duas": 2, + "holt": 2, + "aos": 2, + "iago": 2, + "11t": 2, + "city": 2, + "tyt": 2, + "-la-": 2, + ":13": 2, + "ampi": 2, + "o(i": 2, + "(tau": 2, + "i(p": 2, + "roo,": 2, + "eèt": 2, + "eòr": 2, + "òrom": 2, + "tiàr": 2, + "iroà": 2, + "roà": 2, + "âau": 2, + "ètu": 2, + "tuhu": 2, + "aèo": 2, + "ènan": 2, + "ne),": 2, + "ii:": 2, + "teì": 2, + "eìt": 2, + ",pu": 2, + "prot": 2, + ":\"t": 2, + "ore,": 2, + "être": 2, + "tre.": 2, + "s'é": 2, + "s'éc": 2, + "'écr": 2, + "écri": 2, + "mav": 2, + "ouff": 2, + "fuse": 2, + "mago": 2, + 
"ogiq": 2, + "giqu": 2, + "lep": 2, + "ape’": 2, + "pe’e": 2, + "e’et": 2, + "’ete": 2, + "troj": 2, + "roja": 2, + "ojan": 2, + "jany": 2, + "490": 2, + "or.": 2, + "r.u": 2, + "asik": 2, + "sika": 2, + "ge/": 2, + "e/": 2, + "nore": 2, + "oreg": 2, + "eg/": 2, + "g/": 2, + "rike": 2, + "riik": 2, + "ter.": 2, + "6hu": 2, + "ract": 2, + "acti": 2, + "holc": 2, + "olco": 2, + "5tu": 2, + "iva-": 2, + "va-o": 2, + "a-oa": 2, + "-oa": 2, + "ua-p": 2, + "-pou": 2, + "mā:": 2, + "m²)": 2, + "²)t": 2, + "aa1": 2, + "71t": 2, + "5ma": 2, + "354": 2, + "16t": 2, + "7p": 2, + "7pa": 2, + "518": 2, + "ra9": 2, + "1hi": 2, + "12p": 2, + "ra3": 2, + "235": 2, + "35t": 2, + "120": 2, + "72t": 2, + "5hu": 2, + "aa8": 2, + "oa1": 2, + "20r": 2, + "oa3": 2, + "24u": 2, + "521": 2, + "545": 2, + "45t": 2, + "26f": 2, + "6fa": 2, + "001": 2, + "8ar": 2, + "9te": 2, + "ao6": 2, + "a35": 2, + "3ma": 2, + "a40": 2, + "401": 2, + "122": 2, + "226": 2, + "ngir": 2, + "ka:": 2, + "tiaà": 2, + "iaàa": 2, + "aàau": 2, + "àau": 2, + "aveā": 2, + "veā": 2, + "eān": 2, + "natī": 2, + "atīr": 2, + "tīra": 2, + "īrar": 2, + "u\"p": 2, + "\"per": 2, + "1ga": 2, + "-7": 2, + "a13": 2, + "-5": 2, + "4g": 2, + "4ga": 2, + "se2": 2, + "7o": 2, + "'a1": 2, + "12,8": 2, + "iʻo": 2, + "iao.": 2, + "est,": 2, + "uta,": 2, + "akak": 2, + "hīt": 2, + "hīto": 2, + "cine": 2, + "cann": 2, + "ecro": 2, + "cran": 2, + "ees": 2, + "eest": 2, + "goa.": 2, + "whiw": 2, + "hiwh": 2, + "whin": 2, + "ohu,": 2, + "kaia": 2, + "ako,": 2, + "etak": 2, + "u:h": 2, + "raue": 2, + "auem": 2, + "uemi": 2, + "otuh": 2, + "uhak": 2, + "i\"a": 2, + "\"ak": 2, + "\"ako": 2, + "teng": 2, + "tuki": 2, + "u.k": 2, + "6ng": 2, + "inoh": 2, + "naak": 2, + "aaki": 2, + "6ki": 2, + "12k": 2, + "8ng": 2, + "(tai": 2, + "iohi": 2, + "kaho": 2, + "hoah": 2, + "oaho": 2, + "wari": 2, + ")me": 2, + "esil": 2, + "ekau": 2, + "karō": 2, + "arōp": 2, + "ōpūh": 2, + "pūhi": 2, + "ūhia": 2, + "e(n": 2, + "“ta": 2, + "ga(": 2, + ",wh": 2, + 
"uhin": 2, + "tiim": 2, + "iima": 2, + "waan": 2, + "ma;": 2, + "(ina": 2, + "koj": 2, + "pono": 2, + "coun": 2, + "ounc": 2, + "unci": 2, + "ncil": 2, + "gum": 2, + "ocie": 2, + "ciet": 2, + "iety": 2, + "ety": 2, + "ty(": 2, + "ams)": 2, + "),a": 2, + ",as": 2, + "l(a": 2, + "(ami": 2, + "ofp": 2, + "gres": 2, + "),m": 2, + "msi": 2, + ".ke": 2, + "wao": 2, + "ce,": 2, + "tawh": 2, + "(amf": 2, + "amf)": 2, + "f).": 2, + "nuin": 2, + "he\"": 2, + "a;3": 2, + "u.n": 2, + "hoko": 2, + "aill": 2, + "isw": 2, + "50n": 2, + "nisl": 2, + "slas": 2, + "u.\"": 2, + "iki.": 2, + "ene,": 2, + "pūta": 2, + "aing": 2, + "s,k": 2, + "keng": 2, + ",ah": 2, + "whir": 2, + "lbl": 2, + "i\":": 2, + "\":\"": 2, + ":\"k": 2, + "o.“": 2, + ".“m": 2, + "“mo": 2, + "toko": 2, + "201": 2, + "1ng": 2, + "3i": 2, + "kona": 2, + ",10": 2, + "raru": 2, + "net,": 2, + "d,t": 2, + "a[i": 2, + "[in": 2, + "ori]": 2, + "ri]": 2, + "kahe": 2, + "i.\"": 2, + "unah": 2, + "awap": 2, + "wapa": 2, + "opu.": 2, + "raih": 2, + "aiha": 2, + "f),": 2, + "ra\"": 2, + "cal,": 2, + "utau": 2, + "kapa": 2, + "amut": 2, + "oang": 2, + "keem": 2, + "eemu": 2, + "ohnn": 2, + "hnny": 2, + "yha": 2, + "llyd": 2, + "lyda": 2, + "yday": 2, + "amir": 2, + "5,i": 2, + "s-la": 2, + "owī": 2, + "wīw": 2, + "wīwī": 2, + "h.m": 2, + "toka": 2, + "ck'": 2, + "k'n": 2, + "'n'": 2, + "n'r": 2, + "'ro": 2, + "puor": 2, + "uoro": 2, + "ndb": 2, + "blu": 2, + "blue": 2, + ",so": 2, + "ock,": 2, + "ck,": 2, + "when": 2, + "ahik": 2, + "oim": 2, + "huih": 2, + "uihu": 2, + "ihui": 2, + "e80": 2, + "miri": 2, + "maki": 2, + "puku": 2, + "kupu": 2, + "kahu": 2, + "tron": 2, + "dsc": 2, + ":me": 2, + "th:": 2, + "h:": 2, + "kni": 2, + "knig": 2, + "nigh": 2, + "rnet": 2, + "meta": 2, + "icm": 2, + "(onu": 2, + "onu)": 2, + "enev": 2, + "neva": 2, + "iām": 2, + "1.n": 2, + "orau": 2, + "meo": 2, + "ora;": 2, + ";no": 2, + "cong": 2, + "ae2": 2, + "tā'": 2, + "tā'a": 2, + "ndie": 2, + "dien": 2, + "ārua": 2, + "a'oh": 2, + "alt=": 
2, + "|vig": 2, + "a'aa": 2, + "'aa'": 2, + "a'u,": 2, + "'u,": 2, + "to'o": 2, + "o'on": 2, + "'ona": 2, + "ona'": 2, + "irah": 2, + "māne": 2, + "ānea": 2, + "a'oa": 2, + "oa'o": 2, + "to'u": 2, + "o'un": 2, + "'una": 2, + "a'ē": 2, + "'ēi": 2, + "i'ā": 2, + "'āt": 2, + "māro": 2, + "auha": 2, + ",fl": 2, + "enf": 2, + "e'ī": 2, + "s,o": 2, + "oa'a": 2, + "a'a,": 2, + "mā'e": 2, + "ā'ea": 2, + "e'e": 2, + "rauv": 2, + "uvaa": 2, + "vaa,": 2, + "hīe": 2, + "a'ai": 2, + "ioo": 2, + "anoa": 2, + "u'a.": 2, + "itik": 2, + "tiki": 2, + "'ēhu": 2, + "ēhu": 2, + "u'ā": 2, + "tio,": 2, + "'iri": 2, + "'ōp": 2, + "'ōpū": 2, + "emok": 2, + "moka": 2, + "okar": 2, + "omot": 2, + "tīm": 2, + "tīma": 2, + "īmat": 2, + "aep": 2, + "ndid": 2, + "ie'": 2, + "i,'": 2, + "ārem": 2, + "tāmā": 2, + "āmā'": 2, + "eō'": 2, + "m(m": 2, + "(mou": 2, + "mouv": 2, + "uvem": 2, + "veme": 2, + "n,1": 2, + "ti),": 2, + ",12": 2, + "12m": 2, + "2mā": 2, + "i'e": 2, + "hīk": 2, + "hīko": 2, + "īkoi": 2, + "koi,": 2, + "'api": 2, + "api'": 2, + "ū'o": 2, + "ka'i": 2, + "'i'": 2, + "'ito": 2, + "a'ā": 2, + "i'a'": 2, + "iers": 2, + "akeh": 2, + "brab": 2, + "bant": 2, + "ant,": 2, + "e'ap": 2, + "ura'": 2, + "hoa,": 2, + "omo,": 2, + "āpi'": 2, + "ansh": 2, + "nshi": 2, + "pǔt": 2, + "ǔta": 2, + "popo": 2, + "'e.": 2, + "aeau": 2, + "hide": 2, + "umua": 2, + "muak": 2, + "uaki": 2, + "nryk": 2, + "ryk": 2, + "ykj": 2, + "kja": 2, + "niak": 2, + "tyc": 2, + "tych": 2, + "ychy": 2, + "eti,": 2, + "–2": 2, + "25i": 2, + "akā": 2, + "ele,": 2, + "hul": 2, + "hula": 2, + "paʻ": 2, + "aʻi": 2, + "ʻano": 2, + "ʻii": 2, + "ekū": 2, + "kūl": 2, + "loko": 2, + "anaʻ": 2, + "naʻo": 2, + "ʻoʻ": 2, + "koʻi": 2, + "aupu": 2, + "acks": 2, + "ckso": 2, + "kson": 2, + "kāle": 2, + "ikū": 2, + "hoʻo": 2, + "oʻok": 2, + "\"thr": 2, + "er\"": 2, + "foo": 2, + "hist": 2, + "stor": 2, + "ewo": 2, + "worl": 2, + "orld": 2, + "ess,": 2, + "ss,": 2, + ",g.": 2, + "g.,": 2, + "nbo": 2, + "s,p": 2, + "verp": 2, + "erpo": 
2, + "rpoo": 2, + "pool": 2, + "obal": 2, + "rint": 2, + ":th": 2, + ",ba": 2, + "back": 2, + "si.": 2, + "si(": 2, + "hsiu": 2, + "yu.": 2, + "tai;": 2, + "i.5": 2, + "vehe": 2, + "ueê": 2, + "omǎ": 2, + "i;h": 2, + "u;h": 2, + "14u": 2, + "o:e": 2, + "iti:": 2, + "ti:": 2, + ":15": 2, + "ri;": 2, + "uru:": 2, + "nau,": 2, + "iaî": 2, + "aeï": 2, + "u:e": 2, + "o‘a;": 2, + "‘a;": 2, + ".29": 2, + "30e": 2, + ";na": 2, + "2fa": 2, + "a,5": 2, + "u;a": 2, + ";ai": 2, + "ûai": 2, + "pof": 2, + "ino.": 2, + "o.1": 2, + "12e": 2, + "ïa;": 2, + "kela": 2, + "laï": 2, + ",tu": 2, + "16u": 2, + ";17": 2, + "7ar": 2, + "heï": 2, + "18u": 2, + "aoao": 2, + ";22": 2, + "22e": 2, + "ine;": 2, + "ne;": 2, + "hoê.": 2, + "oê.": 2, + "râr": 2, + "i;3": 2, + "tu;": 2, + "ite;": 2, + "aua.": 2, + "emǎ": 2, + "apun": 2, + "?10": 2, + "ǎta‘": 2, + "vau.": 2, + "a?u": 2, + "?ua": 2, + "aava": 2, + "oep": 2, + "aai,": 2, + "17u": 2, + "epo.": 2, + "po.": 2, + "o.2": 2, + "ova.": 2, + "la:": 2, + "mamo": 2, + "amoe": 2, + "eiô": 2, + "u:1": 2, + "11e": 2, + "oere": 2, + "omai": 2, + "ohe.": 2, + "reê": 2, + "17i": 2, + "tôi": 2, + "a;t": 2, + "oha,": 2, + "8fa": 2, + "irad": 2, + "rada": 2, + "da;": 2, + "mehu": 2, + "ehui": 2, + "huia": 2, + "uiae": 2, + "iael": 2, + "ela;": 2, + "tusa": 2, + "usae": 2, + "sael": 2, + "na;": 2, + "vivo": 2, + "taz": 2, + "ala-": 2, + "la-k": 2, + "a-ka": 2, + "-kai": 2, + "ead": 2, + "âh": 2, + "âho": 2, + "râv": 2, + "24i": 2, + "5it": 2, + "eta;": 2, + "ta;": 2, + "’ue": 2, + "26e": 2, + "osa.": 2, + "ela.": 2, + "8pa": 2, + "e.3": 2, + ".32": 2, + "rôi": 2, + "ia:": 2, + "i.4": 2, + "u.7": 2, + "va;": 2, + "tou:": 2, + "ou:": 2, + "eig": 2, + "oeï": 2, + "i;t": 2, + "i-an": 2, + "-ana": 2, + "a‘e-": 2, + "‘e-h": 2, + "e-hi": 2, + "20o": 2, + "nau‘": 2, + "ao;": 2, + "6a": 2, + "ere-": 2, + "re-a": 2, + "ûar": 2, + ",14": 2, + "i;m": 2, + "pahe": 2, + "ahee": 2, + "eba,": 2, + "pâp": 2, + "pâpâ": 2, + "euu": 2, + "â;": 2, + "â;e": 2, + "marô": 2, + 
"arô": 2, + "ôte": 2, + ",16": 2, + "auhu": 2, + "pûp": 2, + "pûpû": 2, + "no‘a": 2, + "i;i": 2, + "aiâ": 2, + "22i": 2, + "toet": 2, + "oeto": 2, + "etoe": 2, + "x1": 2, + "u;i": 2, + "iǒ": 2, + "ǒn": 2, + "ǒna": 2, + "eta:": 2, + "îpa": 2, + "uain": 2, + "a;a": 2, + "haeh": 2, + "28e": 2, + "29e": 2, + "gome": 2, + "mese": 2, + "esek": 2, + "seka": 2, + "asa.": 2, + "zaï": 2, + "uê": 2, + "aê.": 2, + "zera": 2, + "abat": 2, + "nime": 2, + "erod": 2, + "alan": 2, + "inev": 2, + "eve,": 2, + "obot": 2, + "luda": 2, + "uhi,": 2, + "sido": 2, + "idon": 2, + "hiap": 2, + "iapo": 2, + "ereg": 2, + "ari,": 2, + "doma": 2, + "tii,": 2, + "phak": 2, + "akes": 2, + "kesa": 2, + "esad": 2, + "sada": 2, + "sele": 2, + ",29": 2, + "ba.": 2, + "aith": 2, + "mbc": 2, + "mbch": 2, + "bchb": 2, + "chb": 2, + "hbi": 2, + "oahi": 2, + "arsh": 2, + "igen": 2, + "olym": 2, + "re\"": 2, + "emk": 2, + "ayô": 2, + "orv": 2, + "orve": 2, + "rves": 2, + "vese": 2, + "ough": 2, + "mkp": 2, + "mkpe": 2, + "llco": 2, + "'a-a": 2, + "ipf": 2, + "pfi": 2, + "pfiz": 2, + "fize": 2, + "ersh": 2, + "ship": 2, + "p),": 2, + "êpŭ": 2, + "tolo": 2, + "logi": 2, + "noy": 2, + "yaou": 2, + "aoun": 2, + "ound": 2, + "l'or": 2, + "'oré": 2, + "oréa": 2, + "cham": 2, + "hamp": 2, + "plas": 2, + "lasm": 2, + "asmo": 2, + "smod": 2, + "modi": 2, + "ada.": 2, + "umuh": 2, + "iûi": 2, + "okw": 2, + "echn": 2, + "chno": 2, + "hnol": 2, + "nolo": 2, + "ini-": 2, + "": 2, + ">]": 2, + "oon.": 2, + "pŭr": 2, + "ŭra": 2, + "virc": 2, + "rcho": 2, + "chow": 2, + "0,00": 2, + "'i-f": 2, + "her,": 2, + "lica": 2, + "ngst": 2, + "ill,": 2, + "l,e": 2, + "ĕê.": 2, + "ng'o": 2, + "mcdo": 2, + "cdon": 2, + "êbu": 2, + "hebe": 2, + "ika:": 2, + "auap": 2, + "uapa": 2, + "a]i": 2, + "opw": 2, + "pwa": 2, + "pwan": 2, + "wani": 2, + "ivt": 2, + "vto": 2, + "atât": 2, + "tâta": 2, + "saha": 2, + "â.u": 2, + "epoh": 2, + "ohep": 2, + "jom": 2, + "jomo": 2, + "nafe": 2, + "afea": 2, + "mats": 2, + "atsu": 2, + "tsul": 2, + 
"suli": 2, + "'ut": 2, + "oseb": 2, + "sebe": 2, + "ebel": 2, + "ruau": 2, + "pii,": 2, + "ng'i": 2, + "g'iy": 2, + "'iya": 2, + "um,": 2, + "m,t": 2, + "(aw": 2, + "(awa": 2, + "o'a,": 2, + ".ei": 2, + "nahe": 2, + "ahea": 2, + "faaô": 2, + "aaô": 2, + "aôa": 2, + "bi.": 2, + "ycl": 2, + "mno": 2, + "addi": 2, + "abab": 2, + "cgia": 2, + "giar": 2, + ",ca": 2, + "(ua": 2, + "hiv,": 2, + "iv,": 2, + "a'im": 2, + ".\"r": 2, + "tle,": 2, + "uïar": 2, + "ïara": 2, + "vee": 2, + "mbia": 2, + "joha": 2, + "uro,": 2, + "rkt": 2, + "omj": 2, + "gnes": 2, + "yew": 2, + "yewa": 2, + "ewan": 2, + "avag": 2, + "vage": 2, + "bimb": 2, + "imbo": 2, + "woli": 2, + "oliy": 2, + "liyi": 2, + "igho": 2, + "ghod": 2, + "hoda": 2, + "odar": 2, + "daro": 2, + "aj.": 2, + "j.c": 2, + "m,i": 2, + "sel,": 2, + "meye": 2, + "eyer": 2, + "êau": 2, + "abur": 2, + "buri": 2, + "'iu": 2, + "upau": 2, + "paup": 2, + "ota.": 2, + "eyg": 2, + "ygi": 2, + "girl": 2, + "but": 2, + "seko": 2, + "ekon": 2, + "kond": 2, + "oioi": 2, + "8raa": 2, + "eben": 2, + "ezer": 2, + "umia": 2, + "nema": 2, + "om,": 2, + "egh": 2, + "leti": 2, + "laid": 2, + "aide": 2, + "appi": 2, + "ppia": 2, + "aht": 2, + "ua(": 2, + "c).": 2, + "gh.": 2, + "'ib": 2, + "ha'u": 2, + "a'ut": 2, + "'uti": 2, + "kanv": 2, + "anva": 2, + "nvar": 2, + ")ei": 2, + "rise": 2, + "liam": 2, + "es\"": 2, + "s\"t": 2, + "adak": 2, + "daku": 2, + "âtu": 2, + ",0%": 2, + "dord": 2, + "rdor": 2, + "ssc": 2, + "ess.": 2, + "),u": 2, + "40i": 2, + "40m": 2, + "(sm": 2, + "(sme": 2, + "smeg": 2, + "mega": 2, + "rêt": 2, + "nteh": 2, + ",\"": 2, + "gift": 2, + "'ita": 2, + "ddo,": 2, + "do,": 2, + "n,b": 2, + "(mw": 2, + "ote.": 2, + "cs).": 2, + "tiw": 2, + "tiwh": 2, + "whik": 2, + "hike": 2, + "kete": 2, + "hosp": 2, + "ospi": 2, + "spit": 2, + "rtey": 2, + "ceo": 2, + "lsc": 2, + "choo": 2, + "hool": 2, + "pŭt": 2, + "ŭta": 2, + "ogl": 2, + "moun": 2, + "ount": 2, + "untc": 2, + "ntcr": 2, + "tcre": 2, + "ast,": 2, + "'iv": 2, + "nnu": 2, 
+ ",f.": 2, + "f.,": 2, + "d.t": 2, + "(5)": 2, + "rbal": 2, + "ejis": 2, + "jisu": 2, + "ankr": 2, + "nkro": 2, + "t.g": 2, + "firs": 2, + "irst": 2, + "komf": 2, + "omfo": 2, + "mfo": 2, + "foa": 2, + "'oa.": 2, + "moko": 2, + "okow": 2, + "wab": 2, + "dsi": 2, + "edk": 2, + "dki": 2, + "ingd": 2, + "ngdo": 2, + "gdom": 2, + "â.\"": 2, + ".\"a": 2, + "doe": 2, + "komi": 2, + "isin": 2, + "mfi,": 2, + "abio": 2, + "ddi": 2, + "kpi": 2, + "bum": 2, + "lini": 2, + "bisi": 2, + "isiw": 2, + "echi": 2, + "mant": 2, + "cuba": 2, + "dail": 2, + "aily": 2, + "îe": 2, + "faa.": 2, + "ôno": 2, + "e4r": 2, + "volt": 2, + "olta": 2, + "umu.": 2, + "ngs,": 2, + "gs,": 2, + "omma": 2, + "peac": 2, + "acek": 2, + "ceke": 2, + "ekee": 2, + "keep": 2, + "eepi": 2, + "epin": 2, + "gce": 2, + "mǎrû": 2, + "tv3": 2, + "june": 2, + "ati'": 2, + "apî.": 2, + "pî.": 2, + ".av": 2, + "ecd": 2, + "nsn": 2, + "relu": 2, + "elue": 2, + "ruby": 2, + "uby": 2, + "tal,": 2, + "fe,": 2, + "mo'e": 2, + "ekam": 2, + "kame": 2, + "amek": 2, + "aueu": 2, + "ueue": 2, + "abc": 2, + "bcn": 2, + "cno": 2, + "ise.": 2, + "ote,": 2, + "odun": 2, + "iek": 2, + "kosi": 2, + "osia": 2, + "rgh,": 2, + "gh,": 2, + "h,i": 2, + "h.t": 2, + "c,u": 2, + "hoâ": 2, + "ârâ": 2, + "(sd": 2, + "(sdf": 2, + "sdf)": 2, + "'ep": 2, + "î,t": 2, + "sak": 2, + "dict": 2, + "utir": 2, + "ll-a": 2, + "l-af": 2, + "-afr": 2, + "sule": 2, + "ulem": 2, + "gbe": 2, + "imp": 2, + "pno": 2, + "chps": 2, + "wase": 2, + "fesô": 2, + "esôr": 2, + "sôr": 2, + "uml": 2, + "mlu": 2, + "luu": 2, + "vmb": 2, + "nyu": 2, + "yun": 2, + "yuni": 2, + "niva": 2, + "ivas": 2, + "vasi": 2, + "siti": 2, + ",sh": 2, + "kpaa": 2, + "paa.": 2, + "umô": 2, + "tren": 2, + "lcip": 2, + "tegb": 2, + "egba": 2, + "gbay": 2, + "bayo": 2, + "bow": 2, + "bowe": 2, + "owen": 2, + "wen": 2, + "ienc": 2, + "ce.": 2, + "mole": 2, + "olec": 2, + "lecu": 2, + "ecul": 2, + "nar,": 2, + "auih": 2, + "past": 2, + "steu": 2, + "ur,": 2, + "itum": 2, + "anom": 2, + 
"noma": 2, + "omc": 2, + "mcgi": 2, + "cgil": 2, + "gill": 2, + "edn": 2, + "anyi": 2, + "tanf": 2, + "sten": 2, + "lehn": 2, + "ehn": 2, + "osl": 2, + "osh": 2, + "utta": 2, + "esh.": 2, + "sh.": 2 + } +} \ No newline at end of file diff --git a/visualizations/embedding_alignment_quality.png b/visualizations/embedding_alignment_quality.png new file mode 100644 index 0000000000000000000000000000000000000000..9543f885baff82b9cad58f151250118022d45164 Binary files /dev/null and b/visualizations/embedding_alignment_quality.png differ diff --git a/visualizations/embedding_isotropy.png b/visualizations/embedding_isotropy.png new file mode 100644 index 0000000000000000000000000000000000000000..0ce3124ca083d2e25971eaa37d7fc8693e2b39e0 Binary files /dev/null and b/visualizations/embedding_isotropy.png differ diff --git a/visualizations/embedding_norms.png b/visualizations/embedding_norms.png new file mode 100644 index 0000000000000000000000000000000000000000..4e6d2f51c4188d817ac15fd253dc133770892e6d Binary files /dev/null and b/visualizations/embedding_norms.png differ diff --git a/visualizations/embedding_similarity.png b/visualizations/embedding_similarity.png new file mode 100644 index 0000000000000000000000000000000000000000..3b91606c6cf56e9cc8c6e3946f15f1e7537c53b5 --- /dev/null +++ b/visualizations/embedding_similarity.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75ad716d6e898c55b36fca21a8102afbd3808f51c844179665bb217e7ad1ceeb +size 149226 diff --git a/visualizations/embedding_tsne_multilingual.png b/visualizations/embedding_tsne_multilingual.png new file mode 100644 index 0000000000000000000000000000000000000000..852b9a9bed9a47e1e524e5a0e2eefd217dbd26ee --- /dev/null +++ b/visualizations/embedding_tsne_multilingual.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66ce5d71d4f6de167af8d5d0686f44fdfeb89ac318659016e2473144c0114ed1 +size 237204 diff --git a/visualizations/markov_branching.png 
b/visualizations/markov_branching.png new file mode 100644 index 0000000000000000000000000000000000000000..49b1e010b65f36fe8b0b1ef3187386e10eb0d6ef Binary files /dev/null and b/visualizations/markov_branching.png differ diff --git a/visualizations/markov_contexts.png b/visualizations/markov_contexts.png new file mode 100644 index 0000000000000000000000000000000000000000..9a473ded8f8d2feaa81500773e3fd877e87c5901 Binary files /dev/null and b/visualizations/markov_contexts.png differ diff --git a/visualizations/markov_entropy.png b/visualizations/markov_entropy.png new file mode 100644 index 0000000000000000000000000000000000000000..5a589957168f286dabe863653cd56990fff19ff2 Binary files /dev/null and b/visualizations/markov_entropy.png differ diff --git a/visualizations/model_sizes.png b/visualizations/model_sizes.png new file mode 100644 index 0000000000000000000000000000000000000000..926106b568375d99935ec1e9b1ec52fcd540b83a Binary files /dev/null and b/visualizations/model_sizes.png differ diff --git a/visualizations/nearest_neighbors.png b/visualizations/nearest_neighbors.png new file mode 100644 index 0000000000000000000000000000000000000000..f64f4e0d26016eb0811972dfe93905360846dc95 Binary files /dev/null and b/visualizations/nearest_neighbors.png differ diff --git a/visualizations/ngram_coverage.png b/visualizations/ngram_coverage.png new file mode 100644 index 0000000000000000000000000000000000000000..e6811f174b899877da373118759093f94ecabd78 --- /dev/null +++ b/visualizations/ngram_coverage.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef9559765ab9a9b4430c9dceb419d3210ac2f6ef6f4a4957dfabb709b32eb6ee +size 101411 diff --git a/visualizations/ngram_entropy.png b/visualizations/ngram_entropy.png new file mode 100644 index 0000000000000000000000000000000000000000..745ae2b9c1ad11e9b31d6ce6954ef74716c8599a Binary files /dev/null and b/visualizations/ngram_entropy.png differ diff --git a/visualizations/ngram_perplexity.png 
b/visualizations/ngram_perplexity.png new file mode 100644 index 0000000000000000000000000000000000000000..89e1d12a52cb85263d9e10f9291d318c8244c389 Binary files /dev/null and b/visualizations/ngram_perplexity.png differ diff --git a/visualizations/ngram_unique.png b/visualizations/ngram_unique.png new file mode 100644 index 0000000000000000000000000000000000000000..8dccd19ffe1bd6b01ecbfb38144fb63664a3a995 Binary files /dev/null and b/visualizations/ngram_unique.png differ diff --git a/visualizations/performance_dashboard.png b/visualizations/performance_dashboard.png new file mode 100644 index 0000000000000000000000000000000000000000..ece6fdd41c6d3b3bcabbeddb3bfc75699f4f3a6f --- /dev/null +++ b/visualizations/performance_dashboard.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a39c0c1d5d0b0407024b24ed4a14241faa5bdf44ec9a5629126813d3c3ab29ce +size 371755 diff --git a/visualizations/position_encoding_comparison.png b/visualizations/position_encoding_comparison.png new file mode 100644 index 0000000000000000000000000000000000000000..c80d9b93d3c34ae53ba4e13763e59849c0b6c6a6 --- /dev/null +++ b/visualizations/position_encoding_comparison.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcb364e688dbd7049dacfc7d6ff61bd70b387fcfca89e8276d588c95c35d3509 +size 105329 diff --git a/visualizations/tokenizer_compression.png b/visualizations/tokenizer_compression.png new file mode 100644 index 0000000000000000000000000000000000000000..de616b094223b202e19530ab2b6b04312cf53f0f Binary files /dev/null and b/visualizations/tokenizer_compression.png differ diff --git a/visualizations/tokenizer_fertility.png b/visualizations/tokenizer_fertility.png new file mode 100644 index 0000000000000000000000000000000000000000..1ef6e9079e978af615f5b3b5f4ca6d98cddb4e28 Binary files /dev/null and b/visualizations/tokenizer_fertility.png differ diff --git a/visualizations/tokenizer_oov.png b/visualizations/tokenizer_oov.png new file mode 100644 
index 0000000000000000000000000000000000000000..f7e29ae2d55cb76fc4155b97c7d5a83375bdc500 Binary files /dev/null and b/visualizations/tokenizer_oov.png differ diff --git a/visualizations/tokenizer_total_tokens.png b/visualizations/tokenizer_total_tokens.png new file mode 100644 index 0000000000000000000000000000000000000000..7dd62909ff459c7706f8b695f3736eaa0b09c170 Binary files /dev/null and b/visualizations/tokenizer_total_tokens.png differ diff --git a/visualizations/top20_words.png b/visualizations/top20_words.png new file mode 100644 index 0000000000000000000000000000000000000000..9af8eb4c4a52e9efa8cb63d3d73bc8b96e4c3e35 Binary files /dev/null and b/visualizations/top20_words.png differ diff --git a/visualizations/tsne_sentences.png b/visualizations/tsne_sentences.png new file mode 100644 index 0000000000000000000000000000000000000000..045c8757bf3ebd83d8bac474b9d06d170594ac4d --- /dev/null +++ b/visualizations/tsne_sentences.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd093af01ccb424cb3060c3f4b66b4dfd9a9f9127dfe98302f9cff48d584fafe +size 228879 diff --git a/visualizations/tsne_words.png b/visualizations/tsne_words.png new file mode 100644 index 0000000000000000000000000000000000000000..e4fcc945a763f32eac63b7be3977e57cf39e5703 --- /dev/null +++ b/visualizations/tsne_words.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37880c5e3cf7ba46158dc1ac883cf676d5b6d64c0c08ebd154774a95f881f941 +size 448645 diff --git a/visualizations/vocab_coverage.png b/visualizations/vocab_coverage.png new file mode 100644 index 0000000000000000000000000000000000000000..92900aefe7aef9747ad2b86c23f67c7208bb6852 Binary files /dev/null and b/visualizations/vocab_coverage.png differ diff --git a/visualizations/vocab_freq_dist.png b/visualizations/vocab_freq_dist.png new file mode 100644 index 0000000000000000000000000000000000000000..0048e8ad67d3087ef441d82261d67c17fb71ccba Binary files /dev/null and 
b/visualizations/vocab_freq_dist.png differ diff --git a/visualizations/zipf_law.png b/visualizations/zipf_law.png new file mode 100644 index 0000000000000000000000000000000000000000..c7361c16dd18fba626dcc663818f32eccb19e6fe --- /dev/null +++ b/visualizations/zipf_law.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d4c7b0938842f4625004638b2cd551456c4abb530036c9f48ee31ad4f173866 +size 108028