diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..5128fe6dbab6ef0227c02cffa9ad5350ab6c4dd6 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,9 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +visualizations/embedding_similarity.png filter=lfs diff=lfs merge=lfs -text +visualizations/performance_dashboard.png filter=lfs diff=lfs merge=lfs -text +visualizations/position_encoding_comparison.png filter=lfs diff=lfs merge=lfs -text +visualizations/tsne_sentences.png filter=lfs diff=lfs merge=lfs -text +visualizations/tsne_words.png filter=lfs diff=lfs merge=lfs -text +visualizations/zipf_law.png filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..16173c6d6743d4d6cae51003038c5273a68febae --- /dev/null +++ b/README.md @@ -0,0 +1,555 @@ +--- +language: bm +language_name: BM +language_family: atlantic_other +tags: + - wikilangs + - nlp + - tokenizer + - embeddings + - n-gram + - markov + - wikipedia + - monolingual + - family-atlantic_other +license: mit +library_name: wikilangs +pipeline_tag: feature-extraction +datasets: + - omarkamali/wikipedia-monthly +dataset_info: + name: wikipedia-monthly + description: Monthly snapshots of Wikipedia articles across 300+ languages +metrics: + - name: best_compression_ratio + type: compression + value: 4.070 + - name: best_isotropy + type: isotropy + value: 0.2244 + - name: vocabulary_size + type: vocab + value: 7195 +generated: 2025-12-28 +--- + +# BM - Wikilangs Models +## Comprehensive Research Report & Full Ablation Study + +This repository contains NLP models trained and evaluated by Wikilangs, specifically on **BM** Wikipedia data. +We analyze tokenizers, n-gram models, Markov chains, vocabulary statistics, and word embeddings. 
+ +## 📋 Repository Contents + +### Models & Assets + +- Tokenizers (8k, 16k, 32k, 64k) +- N-gram models (2, 3, 4-gram) +- Markov chains (context of 1, 2, 3 and 4) +- Subword N-gram and Markov chains +- Embeddings in various sizes and dimensions +- Language Vocabulary +- Language Statistics +![Performance Dashboard](visualizations/performance_dashboard.png) + +### Analysis and Evaluation + +- [1. Tokenizer Evaluation](#1-tokenizer-evaluation) +- [2. N-gram Model Evaluation](#2-n-gram-model-evaluation) +- [3. Markov Chain Evaluation](#3-markov-chain-evaluation) +- [4. Vocabulary Analysis](#4-vocabulary-analysis) +- [5. Word Embeddings Evaluation](#5-word-embeddings-evaluation) +- [6. Summary & Recommendations](#6-summary--recommendations) +- [Metrics Glossary](#appendix-metrics-glossary--interpretation-guide) +- [Visualizations Index](#visualizations-index) + +--- +## 1. Tokenizer Evaluation + +![Tokenizer Compression](visualizations/tokenizer_compression.png) + +### Results + +| Vocab Size | Compression | Avg Token Len | UNK Rate | Total Tokens | +|------------|-------------|---------------|----------|--------------| +| **8k** | 3.433x | 3.36 | 0.0887% | 117,303 | +| **16k** | 3.752x | 3.68 | 0.0969% | 107,301 | +| **32k** | 4.070x 🏆 | 3.99 | 0.1051% | 98,934 | + +### Tokenization Examples + +Below are sample sentences tokenized with each vocabulary size: + +**Sample 1:** `Los Angeles ye Amerika ka Kelenyalen Jamanaw ka dugu ye. + + + +Catégorie:Amerika ka...` + +| Vocab | Tokens | Count | +|-------|--------|-------| +| 8k | `▁los ▁angeles ▁ye ▁amerika ▁ka ▁kelenyalen ▁jamanaw ▁ka ▁dugu ▁ye ... (+9 more)` | 19 | +| 16k | `▁los ▁angeles ▁ye ▁amerika ▁ka ▁kelenyalen ▁jamanaw ▁ka ▁dugu ▁ye ... (+9 more)` | 19 | +| 32k | `▁los ▁angeles ▁ye ▁amerika ▁ka ▁kelenyalen ▁jamanaw ▁ka ▁dugu ▁ye ... (+9 more)` | 19 | + +**Sample 2:** `Kunkolosɛmɛ yɛ baganw ani mogow ka kunkolo kɔnɔ yɛ. Mogow bɛ miri kunkolo kɔnɔ. 
+...` + +| Vocab | Tokens | Count | +|-------|--------|-------| +| 8k | `▁kunkolo sɛ mɛ ▁yɛ ▁baganw ▁ani ▁mogow ▁ka ▁kunkolo ▁kɔnɔ ... (+14 more)` | 24 | +| 16k | `▁kunkolo sɛmɛ ▁yɛ ▁baganw ▁ani ▁mogow ▁ka ▁kunkolo ▁kɔnɔ ▁yɛ ... (+11 more)` | 21 | +| 32k | `▁kunkolosɛmɛ ▁yɛ ▁baganw ▁ani ▁mogow ▁ka ▁kunkolo ▁kɔnɔ ▁yɛ . ... (+9 more)` | 19 | + +**Sample 3:** `TaliBailleul, Charles. 2008. Dictionnaire français-bambara. Bamako: Éditions Do...` + +| Vocab | Tokens | Count | +|-------|--------|-------| +| 8k | `▁tali bailleul , ▁charles . ▁ 2 0 0 8 ... (+31 more)` | 41 | +| 16k | `▁tali bailleul , ▁charles . ▁ 2 0 0 8 ... (+31 more)` | 41 | +| 32k | `▁talibailleul , ▁charles . ▁ 2 0 0 8 . ... (+30 more)` | 40 | + + +### Key Findings + +- **Best Compression:** 32k achieves 4.070x compression +- **Lowest UNK Rate:** 8k with 0.0887% unknown tokens +- **Trade-off:** Larger vocabularies improve compression but increase model size +- **Recommendation:** 32k vocabulary provides optimal balance for production use + +--- +## 2. N-gram Model Evaluation + +![N-gram Perplexity](visualizations/ngram_perplexity.png) + +![N-gram Coverage](visualizations/ngram_coverage.png) + +### Results + +| N-gram | Perplexity | Entropy | Unique N-grams | Top-100 Coverage | Top-1000 Coverage | +|--------|------------|---------|----------------|------------------|-------------------| +| **2-gram** (word) | 950 🏆 | 9.89 | 2,854 | 45.2% | 80.3% | +| **2-gram** (subword) | 322 🏆 | 8.33 | 2,127 | 63.8% | 97.9% | +| **3-gram** (word) | 976 | 9.93 | 3,554 | 47.1% | 75.8% | +| **3-gram** (subword) | 2,159 | 11.08 | 11,428 | 27.6% | 72.5% | +| **4-gram** (word) | 1,930 | 10.91 | 8,337 | 41.6% | 58.5% | +| **4-gram** (subword) | 8,659 | 13.08 | 39,905 | 14.4% | 46.6% | + +### Top 5 N-grams by Size + +**2-grams:** + +| Rank | N-gram | Count | +|------|--------|-------| +| 1 | `catégorie :` | 1,068 | +| 2 | `ye .` | 822 | +| 3 | `’ a` | 627 | +| 4 | `ka dugu` | 577 | +| 5 | `. 
sababou` | 571 | + +**3-grams:** + +| Rank | N-gram | Count | +|------|--------|-------| +| 1 | `français - bambara` | 419 | +| 2 | `dictionnaire français -` | 419 | +| 3 | `. dictionnaire français` | 419 | +| 4 | `2008 . dictionnaire` | 419 | +| 5 | `. 2008 .` | 419 | + +**4-grams:** + +| Rank | N-gram | Count | +|------|--------|-------| +| 1 | `. dictionnaire français -` | 419 | +| 2 | `- 04 - 8` | 419 | +| 3 | `français - bambara .` | 419 | +| 4 | `- bambara . bamako` | 419 | +| 5 | `bambara . bamako :` | 419 | + + +### Key Findings + +- **Best Perplexity:** 2-gram (subword) with 322 +- **Entropy Trend:** Increases with larger n-grams on this small corpus (word-level 9.89 → 10.91 bits, subword 8.33 → 13.08 bits), reflecting data sparsity rather than better predictability +- **Coverage:** Top-1000 patterns cover ~47% of corpus for subword 4-grams, rising to ~98% for subword 2-grams +- **Recommendation:** 2-gram gives the best predictive performance on this corpus; no 5-gram model is included in this repository + +--- +## 3. Markov Chain Evaluation + +![Markov Entropy](visualizations/markov_entropy.png) + +![Markov Branching](visualizations/markov_branching.png) + +### Results + +| Context | Avg Entropy | Perplexity | Branching Factor | Unique Contexts | Predictability | +|---------|-------------|------------|------------------|-----------------|----------------| +| **1** (word) | 0.5830 | 1.498 | 3.54 | 18,421 | 41.7% | +| **1** (subword) | 1.2181 | 2.326 | 9.19 | 508 | 0.0% | +| **2** (word) | 0.2211 | 1.166 | 1.48 | 65,151 | 77.9% | +| **2** (subword) | 1.0235 | 2.033 | 5.17 | 4,659 | 0.0% | +| **3** (word) | 0.0800 | 1.057 | 1.13 | 96,171 | 92.0% | +| **3** (subword) | 0.7286 | 1.657 | 3.07 | 24,092 | 27.1% | +| **4** (word) | 0.0309 🏆 | 1.022 | 1.04 | 108,554 | 96.9% | +| **4** (subword) | 0.4796 🏆 | 1.394 | 2.01 | 73,789 | 52.0% | + +### Generated Text Samples + +Below are text samples generated from each Markov chain model: + +**Context Size 1:** + +1. `. farrell , kɔɔnɔ du riz africain , o wati san 1648 - wong vong ye` +2. `, i ka tɔgɔ tun te deli ka dugu tɔw kan , ni swedi , na` +3. `ye ko an bolo suguya kɛmɛ tan kɔnɔ bamakɔ dugu ye ukrainekaw ka kɛnɛya ye jamana` + +**Context Size 2:** + +1. `catégorie : afrika catégorie : cema amerika . 
onu kuntilenna fɔlɔ ye mi ma yiriwa kosɛbɛ .` +2. `ye . catégorie : faransi ka dugu ye . dugumogo be taa jon yooro . gallery sababou` +3. `’ a kulɛriw kan . hadamadenw ka josariyaw ni politikitɔnw ka bɛnkansɛbɛn ye min sigira senkan c` + +**Context Size 3:** + +1. `éditions donniya . isbn 2 - 911741 - 04 - 8 . sababou catégorie : jɛgɛ` +2. `bambara . bamako : éditions donniya . isbn 2 - 911741 - 04 - 8 . sababou catégorie` +3. `français - bambara . bamako : éditions donniya . isbn 2 - 911741 - 04 - 8 .` + +**Context Size 4:** + +1. `, charles . 2008 . dictionnaire français - bambara . bamako : éditions donniya . isbn 2 - 911741` +2. `. dictionnaire français - bambara . bamako : éditions donniya . isbn 2 - 911741 - 04 - 8` +3. `français - bambara . bamako : éditions donniya . isbn 2 - 911741 - 04 - 8 . sababou` + + +### Key Findings + +- **Best Predictability:** Context-4 with 96.9% predictability +- **Branching Factor:** Decreases with context size (more deterministic) +- **Memory Trade-off:** Larger contexts require more storage (73,789 contexts) +- **Recommendation:** Context-3 or Context-4 for text generation + +--- +## 4. 
Vocabulary Analysis + +![Zipf's Law](visualizations/zipf_law.png) + +![Top Words](visualizations/top20_words.png) + +![Coverage Curve](visualizations/vocab_coverage.png) + +### Statistics + +| Metric | Value | +|--------|-------| +| Vocabulary Size | 7,195 | +| Total Tokens | 102,263 | +| Mean Frequency | 14.21 | +| Median Frequency | 3 | +| Frequency Std Dev | 106.29 | + +### Most Common Words + +| Rank | Word | Frequency | +|------|------|-----------| +| 1 | ye | 4,480 | +| 2 | ka | 4,400 | +| 3 | a | 3,281 | +| 4 | la | 1,931 | +| 5 | ni | 1,900 | +| 6 | bɛ | 1,844 | +| 7 | na | 1,626 | +| 8 | min | 1,192 | +| 9 | o | 1,154 | +| 10 | ani | 1,079 | + +### Least Common Words (from vocabulary) + +| Rank | Word | Frequency | +|------|------|-----------| +| 1 | dakon | 2 | +| 2 | taamaɲogonw | 2 | +| 3 | abubakari | 2 | +| 4 | ameniras | 2 | +| 5 | kandasi | 2 | +| 6 | qore | 2 | +| 7 | amɔn | 2 | +| 8 | bajiw | 2 | +| 9 | dunbagaw | 2 | +| 10 | mouvement | 2 | + +### Zipf's Law Analysis + +| Metric | Value | +|--------|-------| +| Zipf Coefficient | 1.0134 | +| R² (Goodness of Fit) | 0.984519 | +| Adherence Quality | **excellent** | + +### Coverage Analysis + +| Top N Words | Coverage | +|-------------|----------| +| Top 100 | 52.0% | +| Top 1,000 | 79.0% | +| Top 5,000 | 95.7% | +| Top 10,000 | N/A (vocabulary has only 7,195 words) | + +### Key Findings + +- **Zipf Compliance:** R²=0.9845 indicates excellent adherence to Zipf's law +- **High Frequency Dominance:** Top 100 words cover 52.0% of corpus +- **Long Tail:** The remaining 2,195 words beyond the top 5,000 account for roughly the last 4.3% of coverage + +--- +## 5. 
Word Embeddings Evaluation + +![Embedding Isotropy](visualizations/embedding_isotropy.png) + +![Similarity Matrix](visualizations/embedding_similarity.png) + +![t-SNE Words](visualizations/tsne_words.png) + +![t-SNE Sentences](visualizations/tsne_sentences.png) + +### Model Comparison + +| Model | Vocab Size | Dimension | Avg Norm | Std Norm | Isotropy | +|-------|------------|-----------|----------|----------|----------| +| **mono_32d** | 2,309 | 32 | 2.998 | 0.730 | 0.2244 🏆 | +| **mono_64d** | 2,309 | 64 | 2.963 | 0.687 | 0.0668 | +| **mono_128d** | 2,309 | 128 | 2.969 | 0.695 | 0.0115 | +| **embeddings_enhanced** | 0 | 0 | 0.000 | 0.000 | 0.0000 | + +### Key Findings + +- **Best Isotropy:** mono_32d with 0.2244 (more uniform distribution) +- **Dimension Trade-off:** Higher dimensions capture more semantics but reduce isotropy +- **Vocabulary Coverage:** All three monolingual models cover 2,309 words +- **Recommendation:** 64d as the middle ground between semantic capture and efficiency among the available models (32d, 64d, 128d); no 100d model is included + +--- +## 6. Summary & Recommendations + +![Performance Dashboard](visualizations/performance_dashboard.png) + +### Production Recommendations + +| Component | Recommended | Rationale | +|-----------|-------------|-----------| +| Tokenizer | **32k BPE** | Best compression (4.07x) with low UNK rate | +| N-gram | **2-gram** | Lowest perplexity (322, subword variant) | +| Markov | **Context-4** | Highest predictability (96.9%) | +| Embeddings | **64d** | Balanced semantic capture and isotropy among the available 32d/64d/128d models | + +--- +## Appendix: Metrics Glossary & Interpretation Guide + +This section provides definitions, intuitions, and guidance for interpreting the metrics used throughout this report. + +### Tokenizer Metrics + +**Compression Ratio** +> *Definition:* The ratio of characters to tokens (chars/token). Measures how efficiently the tokenizer represents text. +> +> *Intuition:* Higher compression means fewer tokens needed to represent the same text, reducing sequence lengths for downstream models. 
A 3x compression means ~3 characters per token on average. +> +> *What to seek:* Higher is generally better for efficiency, but extremely high compression may indicate overly aggressive merging that loses morphological information. + +**Average Token Length (Fertility)** +> *Definition:* Mean number of characters per token produced by the tokenizer. +> +> *Intuition:* Reflects the granularity of tokenization. Longer tokens capture more context but may struggle with rare words; shorter tokens are more flexible but increase sequence length. +> +> *What to seek:* Balance between 2-5 characters for most languages. Arabic/morphologically-rich languages may benefit from slightly longer tokens. + +**Unknown Token Rate (OOV Rate)** +> *Definition:* Percentage of tokens that map to the unknown/UNK token, indicating words the tokenizer cannot represent. +> +> *Intuition:* Lower OOV means better vocabulary coverage. High OOV indicates the tokenizer encounters many unseen character sequences. +> +> *What to seek:* Below 1% is excellent; below 5% is acceptable. BPE tokenizers typically achieve very low OOV due to subword fallback. + +### N-gram Model Metrics + +**Perplexity** +> *Definition:* Measures how "surprised" the model is by test data. Mathematically: 2^(cross-entropy). Lower values indicate better prediction. +> +> *Intuition:* If perplexity is 100, the model is as uncertain as if choosing uniformly among 100 options at each step. A perplexity of 10 means effectively choosing among 10 equally likely options. +> +> *What to seek:* Lower is better. Perplexity typically decreases with larger n-grams (more context) when training data is plentiful; on small corpora, data sparsity can make it increase instead. Values vary widely by language and corpus size. + +**Entropy** +> *Definition:* Average information content (in bits) needed to encode the next token given the context. Related to perplexity: perplexity = 2^entropy. +> +> *Intuition:* High entropy means high uncertainty/randomness; low entropy means predictable patterns. 
Natural language typically has entropy between 1-4 bits per character. +> +> *What to seek:* Lower entropy indicates more predictable text patterns. Entropy should decrease as n-gram size increases. + +**Coverage (Top-K)** +> *Definition:* Percentage of corpus occurrences explained by the top K most frequent n-grams. +> +> *Intuition:* High coverage with few patterns indicates repetitive/formulaic text; low coverage suggests diverse vocabulary usage. +> +> *What to seek:* Depends on use case. For language modeling, moderate coverage (40-60% with top-1000) is typical for natural text. + +### Markov Chain Metrics + +**Average Entropy** +> *Definition:* Mean entropy across all contexts, measuring average uncertainty in next-word prediction. +> +> *Intuition:* Lower entropy means the model is more confident about what comes next. Context-1 has high entropy (many possible next words); Context-4 has low entropy (few likely continuations). +> +> *What to seek:* Decreasing entropy with larger context sizes. Very low entropy (<0.1) indicates highly deterministic transitions. + +**Branching Factor** +> *Definition:* Average number of unique next tokens observed for each context. +> +> *Intuition:* High branching = many possible continuations (flexible but uncertain); low branching = few options (predictable but potentially repetitive). +> +> *What to seek:* Branching factor should decrease with context size. Values near 1.0 indicate nearly deterministic chains. + +**Predictability** +> *Definition:* Derived metric: (1 - normalized_entropy) × 100%. Indicates how deterministic the model's predictions are. +> +> *Intuition:* 100% predictability means the next word is always certain; 0% means completely random. Real text falls between these extremes. +> +> *What to seek:* Higher predictability for text generation quality, but too high (>98%) may produce repetitive output. 
+ +### Vocabulary & Zipf's Law Metrics + +**Zipf's Coefficient** +> *Definition:* The slope of the log-log plot of word frequency vs. rank. Zipf's law predicts this should be approximately -1. +> +> *Intuition:* A coefficient near -1 indicates the corpus follows natural language patterns where a few words are very common and most words are rare. +> +> *What to seek:* Values between -0.8 and -1.2 indicate healthy natural language distribution. Deviations may suggest domain-specific or artificial text. + +**R² (Coefficient of Determination)** +> *Definition:* Measures how well the linear fit explains the frequency-rank relationship. Ranges from 0 to 1. +> +> *Intuition:* R² near 1.0 means the data closely follows Zipf's law; lower values indicate deviation from expected word frequency patterns. +> +> *What to seek:* R² > 0.95 is excellent; > 0.99 indicates near-perfect Zipf adherence typical of large natural corpora. + +**Vocabulary Coverage** +> *Definition:* Cumulative percentage of corpus tokens accounted for by the top N words. +> +> *Intuition:* Shows how concentrated word usage is. If top-100 words cover 50% of text, the corpus relies heavily on common words. +> +> *What to seek:* Top-100 covering 30-50% is typical. Higher coverage indicates more repetitive text; lower suggests richer vocabulary. + +### Word Embedding Metrics + +**Isotropy** +> *Definition:* Measures how uniformly distributed vectors are in the embedding space. Computed as the ratio of minimum to maximum singular values. +> +> *Intuition:* High isotropy (near 1.0) means vectors spread evenly in all directions; low isotropy means vectors cluster in certain directions, reducing expressiveness. +> +> *What to seek:* Higher isotropy generally indicates better-quality embeddings. Values > 0.1 are reasonable; > 0.3 is good. Lower-dimensional embeddings tend to have higher isotropy. + +**Average Norm** +> *Definition:* Mean magnitude (L2 norm) of word vectors in the embedding space. 
+> +> *Intuition:* Indicates the typical "length" of vectors. Consistent norms suggest stable training; high variance may indicate some words are undertrained. +> +> *What to seek:* Relatively consistent norms across models. The absolute value matters less than consistency (low std deviation). + +**Cosine Similarity** +> *Definition:* Measures angular similarity between vectors, ranging from -1 (opposite) to 1 (identical direction). +> +> *Intuition:* Words with similar meanings should have high cosine similarity. This is the standard metric for semantic relatedness in embeddings. +> +> *What to seek:* Semantically related words should score > 0.5; unrelated words should be near 0. Synonyms often score > 0.7. + +**t-SNE Visualization** +> *Definition:* t-Distributed Stochastic Neighbor Embedding - a dimensionality reduction technique that preserves local structure for visualization. +> +> *Intuition:* Clusters in t-SNE plots indicate groups of semantically related words. Spread indicates vocabulary diversity; tight clusters suggest semantic coherence. +> +> *What to seek:* Meaningful clusters (e.g., numbers together, verbs together). Avoid over-interpreting distances - t-SNE preserves local, not global, structure. + +### General Interpretation Guidelines + +1. **Compare within model families:** Metrics are most meaningful when comparing models of the same type (e.g., 8k vs 64k tokenizer). +2. **Consider trade-offs:** Better performance on one metric often comes at the cost of another (e.g., compression vs. OOV rate). +3. **Context matters:** Optimal values depend on downstream tasks. Text generation may prioritize different metrics than classification. +4. **Corpus influence:** All metrics are influenced by corpus characteristics. Wikipedia text differs from social media or literature. +5. **Language-specific patterns:** Morphologically rich languages (like Arabic) may show different optimal ranges than analytic languages. 
+ + +### Visualizations Index + +| Visualization | Description | +|---------------|-------------| +| Tokenizer Compression | Compression ratios by vocabulary size | +| Tokenizer Fertility | Average token length by vocabulary | +| Tokenizer OOV | Unknown token rates | +| Tokenizer Total Tokens | Total tokens by vocabulary | +| N-gram Perplexity | Perplexity by n-gram size | +| N-gram Entropy | Entropy by n-gram size | +| N-gram Coverage | Top pattern coverage | +| N-gram Unique | Unique n-gram counts | +| Markov Entropy | Entropy by context size | +| Markov Branching | Branching factor by context | +| Markov Contexts | Unique context counts | +| Zipf's Law | Frequency-rank distribution with fit | +| Vocab Frequency | Word frequency distribution | +| Top 20 Words | Most frequent words | +| Vocab Coverage | Cumulative coverage curve | +| Embedding Isotropy | Vector space uniformity | +| Embedding Norms | Vector magnitude distribution | +| Embedding Similarity | Word similarity heatmap | +| Nearest Neighbors | Similar words for key terms | +| t-SNE Words | 2D word embedding visualization | +| t-SNE Sentences | 2D sentence embedding visualization | +| Position Encoding | Encoding method comparison | +| Model Sizes | Storage requirements | +| Performance Dashboard | Comprehensive performance overview | + +--- +## About This Project + +### Data Source + +Models trained on [wikipedia-monthly](https://huggingface.co/datasets/omarkamali/wikipedia-monthly) - a monthly snapshot of Wikipedia articles across 300+ languages. + +### Project + +A project by **[Wikilangs](https://wikilangs.org)** - Open-source NLP models for every Wikipedia language. 
+ +### Maintainer + +[Omar Kamali](https://omarkamali.com) - [Omneity Labs](https://omneitylabs.com) + +### Citation + +If you use these models in your research, please cite: + +```bibtex +@misc{wikilangs2025, + author = {Kamali, Omar}, + title = {Wikilangs: Open NLP Models for Wikipedia Languages}, + year = {2025}, + publisher = {HuggingFace}, + url = {https://huggingface.co/wikilangs}, + institution = {Omneity Labs} +} +``` + +### License + +MIT License - Free for academic and commercial use. + +### Links + +- 🌐 Website: [wikilangs.org](https://wikilangs.org) +- 🤗 Models: [huggingface.co/wikilangs](https://huggingface.co/wikilangs) +- 📊 Data: [wikipedia-monthly](https://huggingface.co/datasets/omarkamali/wikipedia-monthly) +- 👤 Author: [Omar Kamali](https://huggingface.co/omarkamali) +--- +*Generated by Wikilangs Models Pipeline* + +*Report Date: 2025-12-28 05:28:29* diff --git a/models/embeddings/monolingual/bm_128d.bin b/models/embeddings/monolingual/bm_128d.bin new file mode 100644 index 0000000000000000000000000000000000000000..a2a170e765772226cb0d0420349bb571b483b583 --- /dev/null +++ b/models/embeddings/monolingual/bm_128d.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f0d7c8930252db4f75ccff26903504087a5598f8e89d5877efdc3838fa71e4e +size 1026401129 diff --git a/models/embeddings/monolingual/bm_128d.meta.json b/models/embeddings/monolingual/bm_128d.meta.json new file mode 100644 index 0000000000000000000000000000000000000000..65e3cb04cee5886eb5f2c11ccaf044be520cf352 --- /dev/null +++ b/models/embeddings/monolingual/bm_128d.meta.json @@ -0,0 +1 @@ +{"lang": "bm", "dim": 128, "max_seq_len": 512, "is_aligned": false} \ No newline at end of file diff --git a/models/embeddings/monolingual/bm_128d_metadata.json b/models/embeddings/monolingual/bm_128d_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1a264fc17e90c3bb0cf7926f5efdc6778111ebe2 --- /dev/null +++ 
b/models/embeddings/monolingual/bm_128d_metadata.json @@ -0,0 +1,13 @@ +{ + "language": "bm", + "dimension": 128, + "version": "monolingual", + "training_params": { + "dim": 128, + "min_count": 5, + "window": 5, + "negative": 5, + "epochs": 5 + }, + "vocab_size": 2309 +} \ No newline at end of file diff --git a/models/embeddings/monolingual/bm_32d.bin b/models/embeddings/monolingual/bm_32d.bin new file mode 100644 index 0000000000000000000000000000000000000000..05b41e1d21d4089e054616e38579de3932778d66 --- /dev/null +++ b/models/embeddings/monolingual/bm_32d.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecbf3cf75d36d5786a480590916fad5d6bc30b12637de0b8e671f92799273b4e +size 256627817 diff --git a/models/embeddings/monolingual/bm_32d.meta.json b/models/embeddings/monolingual/bm_32d.meta.json new file mode 100644 index 0000000000000000000000000000000000000000..ac09ee66c3dc8de3beb2232731729aae7e885cc6 --- /dev/null +++ b/models/embeddings/monolingual/bm_32d.meta.json @@ -0,0 +1 @@ +{"lang": "bm", "dim": 32, "max_seq_len": 512, "is_aligned": false} \ No newline at end of file diff --git a/models/embeddings/monolingual/bm_32d_metadata.json b/models/embeddings/monolingual/bm_32d_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..7b5a9338f2d19c36c19a5bee6ec9ba824e478b43 --- /dev/null +++ b/models/embeddings/monolingual/bm_32d_metadata.json @@ -0,0 +1,13 @@ +{ + "language": "bm", + "dimension": 32, + "version": "monolingual", + "training_params": { + "dim": 32, + "min_count": 5, + "window": 5, + "negative": 5, + "epochs": 5 + }, + "vocab_size": 2309 +} \ No newline at end of file diff --git a/models/embeddings/monolingual/bm_64d.bin b/models/embeddings/monolingual/bm_64d.bin new file mode 100644 index 0000000000000000000000000000000000000000..62fa650c437352cb4dafe059ee51c9259278ed64 --- /dev/null +++ b/models/embeddings/monolingual/bm_64d.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:03ddc93065212141e650c80ef4273e04a2ec47432a07bd4dc33ebf690234049c +size 513218921 diff --git a/models/embeddings/monolingual/bm_64d.meta.json b/models/embeddings/monolingual/bm_64d.meta.json new file mode 100644 index 0000000000000000000000000000000000000000..0df9c6a110ed5f048993ee4f50bdb3df37a9d879 --- /dev/null +++ b/models/embeddings/monolingual/bm_64d.meta.json @@ -0,0 +1 @@ +{"lang": "bm", "dim": 64, "max_seq_len": 512, "is_aligned": false} \ No newline at end of file diff --git a/models/embeddings/monolingual/bm_64d_metadata.json b/models/embeddings/monolingual/bm_64d_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..d9caec59e06b518fc8aa81308f0fc91bf3e76512 --- /dev/null +++ b/models/embeddings/monolingual/bm_64d_metadata.json @@ -0,0 +1,13 @@ +{ + "language": "bm", + "dimension": 64, + "version": "monolingual", + "training_params": { + "dim": 64, + "min_count": 5, + "window": 5, + "negative": 5, + "epochs": 5 + }, + "vocab_size": 2309 +} \ No newline at end of file diff --git a/models/subword_markov/bm_markov_ctx1_subword.parquet b/models/subword_markov/bm_markov_ctx1_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..123dec3748f2d72be5906896666c5c7659acd578 --- /dev/null +++ b/models/subword_markov/bm_markov_ctx1_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0819a99ba610dc7d0095d059a8cd0fbf0e93d96340fab94bfe408f6e78c431e4 +size 40112 diff --git a/models/subword_markov/bm_markov_ctx1_subword_metadata.json b/models/subword_markov/bm_markov_ctx1_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..c5cad5b3b41306e55802ed02a9ee077b1f43e1e5 --- /dev/null +++ b/models/subword_markov/bm_markov_ctx1_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 1, + "variant": "subword", + "language": "bm", + "unique_contexts": 508, + "total_transitions": 649338 +} \ No newline at end of file diff --git 
a/models/subword_markov/bm_markov_ctx2_subword.parquet b/models/subword_markov/bm_markov_ctx2_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..d177b392414034a349651ba4759107a3769d5f94 --- /dev/null +++ b/models/subword_markov/bm_markov_ctx2_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb80b6a46cd1c2d4387947a64a191c8c3a0e17cb30ee46dd9853eb3f4e28c6a +size 184560 diff --git a/models/subword_markov/bm_markov_ctx2_subword_metadata.json b/models/subword_markov/bm_markov_ctx2_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..3ab9ca0e3bde92f944deda1f24efe9fbc50064f7 --- /dev/null +++ b/models/subword_markov/bm_markov_ctx2_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 2, + "variant": "subword", + "language": "bm", + "unique_contexts": 4659, + "total_transitions": 648039 +} \ No newline at end of file diff --git a/models/subword_markov/bm_markov_ctx3_subword.parquet b/models/subword_markov/bm_markov_ctx3_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..5b1e03354083d444268326e70716e7d5ce0d817c --- /dev/null +++ b/models/subword_markov/bm_markov_ctx3_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2346a42c76aff72fd2b3fe02f559333cd9dda578b8ced3ba260d8cf6e2171a4e +size 546787 diff --git a/models/subword_markov/bm_markov_ctx3_subword_metadata.json b/models/subword_markov/bm_markov_ctx3_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..52b7bdf3b7ef6cc1388c710d854b50d81d7553e6 --- /dev/null +++ b/models/subword_markov/bm_markov_ctx3_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 3, + "variant": "subword", + "language": "bm", + "unique_contexts": 24092, + "total_transitions": 646740 +} \ No newline at end of file diff --git a/models/subword_markov/bm_markov_ctx4_subword.parquet 
b/models/subword_markov/bm_markov_ctx4_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..c1a6bd66ad6c9b3366ba0248c1d28015157c5d8e --- /dev/null +++ b/models/subword_markov/bm_markov_ctx4_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1d7257d4abefb8c32f0420d2d9fc0d913bcdb5e4772236891d7490a5264704a +size 1226126 diff --git a/models/subword_markov/bm_markov_ctx4_subword_metadata.json b/models/subword_markov/bm_markov_ctx4_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1bd1f007c6242dc9a5540f72ed12bdb1917536d1 --- /dev/null +++ b/models/subword_markov/bm_markov_ctx4_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 4, + "variant": "subword", + "language": "bm", + "unique_contexts": 73789, + "total_transitions": 645441 +} \ No newline at end of file diff --git a/models/subword_ngram/bm_2gram_subword.parquet b/models/subword_ngram/bm_2gram_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..d4a5b59cc5c7b935377d6334e10935bc1ebde99b --- /dev/null +++ b/models/subword_ngram/bm_2gram_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06ce57f95742b61708e17e229d33f174f2dabe7ae11cfc1872a7a6182573cfcc +size 26169 diff --git a/models/subword_ngram/bm_2gram_subword_metadata.json b/models/subword_ngram/bm_2gram_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f2bd4259ef97b848a6a15e329370b7d3505e81ad --- /dev/null +++ b/models/subword_ngram/bm_2gram_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 2, + "variant": "subword", + "language": "bm", + "unique_ngrams": 2127, + "total_ngrams": 649338 +} \ No newline at end of file diff --git a/models/subword_ngram/bm_3gram_subword.parquet b/models/subword_ngram/bm_3gram_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..42bde8c5606ea8a0651b784b74df228a636e350a --- 
/dev/null +++ b/models/subword_ngram/bm_3gram_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f6c3f360cbad86d31de6197b81525e30f7a976dc638b3ca0ae073b2a98553a6 +size 131173 diff --git a/models/subword_ngram/bm_3gram_subword_metadata.json b/models/subword_ngram/bm_3gram_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..de4a7ef1974a0225bc4c4ef52f9a8593047db2f3 --- /dev/null +++ b/models/subword_ngram/bm_3gram_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 3, + "variant": "subword", + "language": "bm", + "unique_ngrams": 11428, + "total_ngrams": 648039 +} \ No newline at end of file diff --git a/models/subword_ngram/bm_4gram_subword.parquet b/models/subword_ngram/bm_4gram_subword.parquet new file mode 100644 index 0000000000000000000000000000000000000000..878685bd153288027c972c96322699ebde56636e --- /dev/null +++ b/models/subword_ngram/bm_4gram_subword.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66a769c12a2d8a97eff8c9d92dea9868be0c798775b864d08da7c4cc28cc988f +size 486277 diff --git a/models/subword_ngram/bm_4gram_subword_metadata.json b/models/subword_ngram/bm_4gram_subword_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..29947197bffa7613edca39a80dd70db282741d63 --- /dev/null +++ b/models/subword_ngram/bm_4gram_subword_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 4, + "variant": "subword", + "language": "bm", + "unique_ngrams": 39905, + "total_ngrams": 646740 +} \ No newline at end of file diff --git a/models/tokenizer/bm_tokenizer_16k.model b/models/tokenizer/bm_tokenizer_16k.model new file mode 100644 index 0000000000000000000000000000000000000000..b119bde57427c513a615a8d882034a25ce208943 --- /dev/null +++ b/models/tokenizer/bm_tokenizer_16k.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9296d04641b8a3567ec23dd58f2570e88576b52be897baa8365b0b75d62817db +size 512912 diff --git 
a/models/tokenizer/bm_tokenizer_16k.vocab b/models/tokenizer/bm_tokenizer_16k.vocab new file mode 100644 index 0000000000000000000000000000000000000000..2d8a0b1522ccbf727506025224d8a83992052ea4 --- /dev/null +++ b/models/tokenizer/bm_tokenizer_16k.vocab @@ -0,0 +1,16000 @@ + 0 + 0 + 0 + 0 +▁k -0 +an -1 +▁s -2 +▁b -3 +▁d -4 +▁n -5 +▁y -6 +▁m -7 +in -8 +▁f -9 +▁ka -10 +la -11 +ar -12 +▁t -13 +▁ye -14 +am -15 +on -16 +en -17 +▁a -18 +li -19 +▁c -20 +ri -21 +▁j -22 +▁la -23 +ti -24 +ba -25 +le -26 +ɔn -27 +gu -28 +go -29 +ya -30 +ra -31 +▁bɛ -32 +ara -33 +ugu -34 +▁ni -35 +un -36 +▁na -37 +▁w -38 +ana -39 +is -40 +▁min -41 +at -42 +ɔr -43 +ɛn -44 +▁ma -45 +▁o -46 +ma -47 +len -48 +re -49 +ani -50 +ko -51 +ka -52 +▁kɛ -53 +▁si -54 +ɔrɔ -55 +si -56 +lo -57 +▁( -58 +▁sa -59 +▁dugu -60 +ro -61 +▁ko -62 +amana -63 +ɔg -64 +▁san -65 +ga -66 +na -67 +rie -68 +il -69 +tion -70 +ama -71 +▁cat -72 +▁ani -73 +égo -74 +égorie -75 +▁catégorie -76 +ou -77 +▁p -78 +di -79 +▁ba -80 +▁don -81 +ni -82 +▁ta -83 +ul -84 +▁jamana -85 +▁di -86 +gi -87 +ɔgɔ -88 +▁h -89 +▁kan -90 +er -91 +▁ɲ -92 +▁u -93 +▁wa -94 +ɛr -95 +▁e -96 +▁i -97 +so -98 +ta -99 +kan -100 +ran -101 +▁saba -102 +▁se -103 +ɔnɔ -104 +da -105 +ogo -106 +bi -107 +▁de -108 +ki -109 +ur -110 +sa -111 +▁fɛ -112 +▁sabab -113 +ari -114 +lan -115 +▁da -116 +oro -117 +▁ch -118 +▁be -119 +▁fɔ -120 +▁g -121 +▁fa -122 +▁kɔ -123 +▁kɔnɔ -124 +es -125 +▁sababou -126 +▁in -127 +▁dɔ -128 +▁ke -129 +▁tun -130 +▁fran -131 +kɛ -132 +iri -133 +les -134 +ɛrɛ -135 +▁bama -136 +te -137 +us -138 +olo -139 +or -140 +▁is -141 +ire -142 +ille -143 +aman -144 +he -145 +▁sɔrɔ -146 +aran -147 +▁ku -148 +▁ti -149 +fɛ -150 +▁é -151 +niya -152 +ɛb -153 +▁bamako -154 +bara -155 +tions -156 +ais -157 +▁franç -158 +bn -159 +ini -160 +bam -161 +▁français -162 +se -163 +▁dic -164 +▁kelen -165 +▁char -166 +▁isbn -167 +▁ha -168 +um -169 +ditions -170 +▁donniya -171 +▁charles -172 +naire -173 +▁diction -174 +baille -175 +bambara -176 +bailleul -177 +▁éditions -178 
+▁dictionnaire -179 +ke -180 +den -181 +eri -182 +nu -183 +aransi -184 +▁taa -185 +▁sigi -186 +▁bɔ -187 +▁an -188 +▁man -189 +▁bi -190 +inɛ -191 +▁ji -192 +fa -193 +lɛ -194 +ɲɛ -195 +▁fan -196 +gɛ -197 +▁af -198 +▁minnu -199 +▁mali -200 +ch -201 +mɛ -202 +). -203 +to -204 +de -205 +▁v -206 +▁kɔfɛ -207 +▁sira -208 +ji -209 +wa -210 +▁ja -211 +uru -212 +▁ɲɛ -213 +ulu -214 +▁" -215 +ɔrɔn -216 +lu -217 +▁baara -218 +bɔ -219 +ameri -220 +be -221 +jɛ -222 +▁yo -223 +▁mɔgɔ -224 +▁fara -225 +▁kun -226 +▁dan -227 +▁sen -228 +ye -229 +oli -230 +▁caman -231 +dugu -232 +▁mo -233 +wu -234 +ina -235 +ine -236 +ge -237 +▁fi -238 +▁cɛ -239 +ku -240 +▁mara -241 +ca -242 +yɔrɔ -243 +lɔ -244 +▁tɛ -245 +▁. -246 +man -247 +▁kuma -248 +bo -249 +bu -250 +tu -251 +▁faransi -252 +ce -253 +nen -254 +lima -255 +▁yɔrɔ -256 +▁to -257 +me -258 +qu -259 +▁tu -260 +▁dɔn -261 +ne -262 +don -263 +tigi -264 +ɔgɔn -265 +▁jamanaw -266 +px -267 +▁ɛn -268 +▁tɔgɔ -269 +▁woro -270 +▁su -271 +▁yɛ -272 +pa -273 +lon -274 +ent -275 +▁faso -276 +▁gu -277 +gan -278 +▁ameri -279 +▁ca -280 +▁do -281 +▁mu -282 +▁ya -283 +▁kɛra -284 +▁bɛɛ -285 +ɛnɛ -286 +yalen -287 +), -288 +▁worodugu -289 +ci -290 +cogo -291 +we -292 +▁mi -293 +▁nke -294 +▁ọ -295 +hi -296 +kolo -297 +▁fo -298 +▁afri -299 +▁ga -300 +ha -301 +ɛbɛn -302 +▁jon -303 +jamana -304 +▁walima -305 +do -306 +mu -307 +▁ban -308 +fan -309 +▁tle -310 +nan -311 +▁nin -312 +▁kɔrɔ -313 +▁kɛlɛ -314 +▁yɛrɛ -315 +▁so -316 +ban -317 +▁kalan -318 +heli -319 +▁cogo -320 +▁l -321 +tɛr -322 +uni -323 +▁kos -324 +inɛti -325 +▁fanga -326 +▁saheli -327 +tɛrinɛti -328 +ja -329 +wi -330 +▁dugum -331 +▁ɛntɛrinɛti -332 +▁dɛ -333 +▁re -334 +kili -335 +▁dugumogo -336 +▁yooro -337 +▁bo -338 +▁jɛ -339 +yiri -340 +▁fɔlɔ -341 +kun -342 +▁le -343 +ati -344 +▁r -345 +oni -346 +amara -347 +th -348 +yan -349 +▁ɲɔgɔn -350 +ate -351 +▁fana -352 +▁siti -353 +faransi -354 +du -355 +hụ -356 +st -357 +▁bolo -358 +al -359 +rô -360 +▁kon -361 +bin -362 +ɛbɛ -363 +▁z -364 +▁we -365 +▁kelenyalen 
-366 +ôrô -367 +▁masa -368 +ilan -369 +▁waati -370 +kọ -371 +▁du -372 +▁bon -373 +▁den -374 +▁fasojamana -375 +kɛla -376 +▁mans -377 +gh -378 +▁ki -379 +▁dam -380 +mi -381 +yi -382 +sen -383 +fi -384 +isi -385 +tin -386 +risi -387 +co -388 +▁sugu -389 +▁wala -390 +pu -391 +aba -392 +▁co -393 +▁tile -394 +▁jira -395 +▁tlebi -396 +▁mansamara -397 +kɔ -398 +vi -399 +gwu -400 +ɛgɛ -401 +▁wɛrɛ -402 +fin -403 +mɔgɔ -404 +▁me -405 +▁te -406 +denw -407 +▁afrika -408 +pe -409 +ata -410 +▁al -411 +▁ne -412 +▁amerika -413 +po -414 +dɔn -415 +af -416 +▁kɛmɛ -417 +.[ -418 +gin -419 +kulu -420 +▁kosɛbɛ -421 +ve -422 +ter -423 +▁jɔ -424 +▁jo -425 +▁nka -426 +amanan -427 +▁gun -428 +▁li -429 +▁vi -430 +▁tan -431 +▁jate -432 +que -433 +▁faaba -434 +▁sɛbɛn -435 +▁egwu -436 +▁: -437 +tan -438 +▁ci -439 +▁- -440 +▁diɲɛ -441 +fɔ -442 +pi -443 +▁yen -444 +▁walasa -445 +▁bamanan -446 +zi -447 +▁ar -448 +▁of -449 +▁bɔra -450 +yanfan -451 +kụ -452 +▁kè -453 +▁dɔw -454 +fe -455 +amu -456 +kɔnɔ -457 +▁bila -458 +▁bè -459 +ɛna -460 +urun -461 +▁olu -462 +▁kɔrɔn -463 +▁dugukolo -464 +ing -465 +et -466 +▁ro -467 +▁fɛn -468 +▁kɔn -469 +▁hakɛ -470 +mo -471 +▁no -472 +▁po -473 +dị -474 +gô -475 +kalo -476 +▁son -477 +▁kulu -478 +▁yiri -479 +bụ -480 +cɛ -481 +ft -482 +▁ju -483 +ɛrɛn -484 +ariya -485 +▁yoga -486 +as -487 +▁mar -488 +▁kô -489 +▁ali -490 +▁— -491 +tiki -492 +▁tɔn -493 +▁jago -494 +san -495 +iriki -496 +▁uk -497 +▁daminɛ -498 +▁dô -499 +▁afiriki -500 +▁sin -501 +lle -502 +bli -503 +dala -504 +▁bana -505 +▁sababu -506 +▁“ -507 +kɔn -508 +ɛri -509 +▁fô -510 +wift -511 +▁fil -512 +▁mis -513 +ry -514 +▁ŋ -515 +▁aw -516 +uman -517 +▁swift -518 +▁mari -519 +▁bé -520 +tigɛ -521 +▁kɔgɔ -522 +sh -523 +▁jan -524 +▁fila -525 +▁jɛkulu -526 +ôgô -527 +ariku -528 +▁kura -529 +▁tuma -530 +▁wele -531 +▁con -532 +▁pro -533 +▁poli -534 +▁suguya -535 +▁fe -536 +▁tɔ -537 +▁kɛr -538 +▁boli -539 +su -540 +dan -541 +▁dị -542 +kụkọ -543 +▁the -544 +▁bɛna -545 +▁wɛrɛw -546 +▁kɔgɔji -547 +yo -548 +kaw -549 +wan 
-550 +▁sis -551 +▁kɛnɛ -552 +▁ukra -553 +au -554 +min -555 +fara -556 +jago -557 +▁bin -558 +▁sôrô -559 +▁ɲɛmɔgɔ -560 +▁ɔ -561 +ene -562 +kɔrɔ -563 +▁ce -564 +▁nɔ -565 +▁on -566 +▁muso -567 +▁sɛnɛ -568 +▁dilan -569 +ll -570 +tt -571 +ɲi -572 +ịhụ -573 +▁fari -574 +▁bamanankan -575 +ali -576 +gne -577 +nanya -578 +ịhụnanya -579 +▁bu -580 +▁lo -581 +▁des -582 +▁kab -583 +▁с -584 +▁lam -585 +▁sariya -586 +pụ -587 +▁et -588 +baga -589 +▁fin -590 +▁jɛn -591 +je -592 +▁ụ -593 +our -594 +ron -595 +taa -596 +▁franse -597 +εε -598 +▁[ -599 +▁« -600 +ami -601 +ega -602 +fɛn -603 +▁ho -604 +bolo -605 +▁laban -606 +▁hakili -607 +eni -608 +▁ahụ -609 +▁ndị -610 +amerika -611 +ru -612 +ty -613 +té -614 +dio -615 +sin -616 +▁pa -617 +mali -618 +ropa -619 +▁lab -620 +▁foro -621 +▁yiriwa -622 +▁farafin -623 +law -624 +ver -625 +▁naf -626 +ts -627 +ard -628 +dia -629 +▁fu -630 +▁/ -631 +▁at -632 +▁daɲɛ -633 +.. -634 +ww -635 +ere -636 +nin -637 +▁en -638 +▁go -639 +▁yé -640 +▁tra -641 +▁kama -642 +ɔrɔnya -643 +▁senega -644 +▁– -645 +int -646 +son -647 +▁bụ -648 +▁sh -649 +▁wi -650 +ulon -651 +kɛlaw -652 +kɛrɛn -653 +▁siri -654 +▁tariku -655 +▁baarakɛ -656 +▁+ -657 +sia -658 +▁baw -659 +▁dabɔ -660 +▁marifa -661 +rụ -662 +на -663 +▁, -664 +las -665 +bali -666 +jɛgɛ -667 +yali -668 +▁taama -669 +▁kɛmɛda -670 +▁sigilen -671 +rè -672 +che -673 +kow -674 +dama -675 +lenw -676 +▁kolon -677 +▁mɔgɔw -678 +▁sigira -679 +▁ameriki -680 +▁jamanadenw -681 +▁ɛ -682 +pan -683 +▁lu -684 +▁un -685 +▁duni -686 +▁lajɛ -687 +▁laka -688 +▁sila -689 +èn -690 +ск -691 +ena -692 +▁aka -693 +▁gine -694 +ра -695 +ber -696 +▁es -697 +▁wo -698 +▁dun -699 +▁laa -700 +publi -701 +▁cent -702 +▁tugu -703 +dɔnnen -704 +▁kɛrɛn -705 +▁bamakɔ -706 +▁jɔyɔrɔ -707 +▁politiki -708 +▁в -709 +are -710 +baw -711 +naf -712 +▁dé -713 +▁nt -714 +▁ra -715 +land -716 +tara -717 +▁tali -718 +▁wale -719 +▁cogoya -720 +▁masala -721 +kɛrɛnnen -722 +ré -723 +то -724 +mis -725 +▁je -726 +afri -727 +▁mas -728 +▁mili -729 +▁sisan -730 +el 
-731 +fo -732 +ps -733 +chi -734 +kar -735 +yɛn -736 +▁kaba -737 +▁minɛ -738 +▁site -739 +▁к -740 +jan -741 +res -742 +ton -743 +▁bar -744 +▁bɛn -745 +▁nafa -746 +▁kɛrɛnkɛrɛnnen -747 +ph -748 +ɛni -749 +hara -750 +▁ihe -751 +arabu -752 +bagan -753 +kalan -754 +▁kɔkan -755 +▁mansa -756 +▁kabini -757 +ck -758 +baa -759 +bia -760 +mba -761 +tra -762 +▁sun -763 +▁fanba -764 +▁tulon -765 +▁kunnaf -766 +▁farafinna -767 +lé -768 +va -769 +ces -770 +cha -771 +lin -772 +mar -773 +tte -774 +▁ale -775 +▁fla -776 +sɛbɛn -777 +▁sika -778 +ال -779 +tik -780 +ment -781 +tali -782 +▁nan -783 +▁hali -784 +▁tila -785 +afrika -786 +▁eropa -787 +▁laadala -788 +▁ịhụnanya -789 +▁jamanaden -790 +kw -791 +▁hi -792 +▁sɛ -793 +bila -794 +▁abụ -795 +▁mun -796 +▁sou -797 +▁cɛma -798 +▁kalo -799 +▁ukraine -800 +ct -801 +tɛ -802 +ɲa -803 +▁л -804 +▁р -805 +babu -806 +sira -807 +▁kar -808 +▁nana -809 +▁yɛlɛ -810 +▁danbɔ -811 +▁irisi -812 +▁sahara -813 +▁sigida -814 +▁kunnafoni -815 +za -816 +rit -817 +èrè -818 +▁sɛb -819 +ugula -820 +ɛnajɛ -821 +▁wari -822 +▁bonya -823 +▁filmu -824 +tɔ -825 +▁; -826 +▁th -827 +▁sam -828 +▁uni -829 +kelen -830 +kɔrɔn -831 +▁fɔli -832 +▁fɛɛrɛ -833 +▁sɛben -834 +▁hadama -835 +▁danfara -836 +по -837 +▁| -838 +liw -839 +ste -840 +tes -841 +uli -842 +ence -843 +lanw -844 +▁lib -845 +▁kilo -846 +▁kolo -847 +▁tiɲɛ -848 +// -849 +vo -850 +▁ʃ -851 +can -852 +mes -853 +ɛlɛ -854 +▁as -855 +▁pe -856 +dasi -857 +fasi -858 +wari -859 +▁ala -860 +▁mon -861 +▁yan -862 +▁ɲin -863 +▁dɔgɔ -864 +▁jugu -865 +▁minu -866 +▁musa -867 +▁jigin -868 +▁saint -869 +kuntigi -870 +:// -871 +ilɛ -872 +tɔn -873 +bola -874 +gera -875 +▁dala -876 +▁tɛmɛ -877 +▁akụkọ -878 +▁faran -879 +▁senkan -880 +▁farikolo -881 +mb -882 +sɛ -883 +des -884 +han -885 +mah -886 +nes -887 +▁nk -888 +▁pi -889 +ania -890 +▁art -891 +▁bam -892 +▁kul -893 +▁par -894 +▁dɛmɛ -895 +▁sini -896 +▁dunia -897 +▁sɔrɔdasi -898 +no -899 +arị -900 +der -901 +▁ex -902 +▁nu -903 +bili -904 +▁hak -905 +donna -906 +mancɛ -907 +tinin 
-908 +ɛnama -909 +▁kɛɲɛ -910 +▁seko -911 +▁sera -912 +cation -913 +▁atlan -914 +▁kongo -915 +▁foroba -916 +▁fitinin -917 +dɔ -918 +nô -919 +tle -920 +usu -921 +▁am -922 +▁au -923 +▁er -924 +▁gi -925 +buru -926 +sɛgɛ -927 +▁ama -928 +▁jɔn -929 +▁wee -930 +▁fili -931 +▁nɛgɛ -932 +▁sara -933 +▁sɛgɛ -934 +▁bagan -935 +▁kungo -936 +▁segin -937 +▁africa -938 +▁nafolo -939 +▁jamanakuntigi -940 +ен -941 +▁* -942 +▁» -943 +lar -944 +yɔn -945 +ɔra -946 +▁fè -947 +paɲi -948 +▁mus -949 +▁tum -950 +▁bara -951 +▁ɛndu -952 +▁ebola -953 +▁galle -954 +▁kɛnɛya -955 +▁sɔrɔko -956 +▁yɛlɛma -957 +▁cɛmancɛ -958 +▁dɔnkili -959 +▁yɛrɛmah -960 +▁madɔnnen -961 +▁sigiyɔrɔ -962 +ho -963 +aka -964 +ben -965 +ger -966 +gon -967 +mɛn -968 +orr -969 +run -970 +sun -971 +tto -972 +urs -973 +▁bô -974 +▁là -975 +▁sé -976 +▁ال -977 +pụta -978 +were -979 +▁and -980 +▁dum -981 +▁for -982 +▁les -983 +▁por -984 +akụkọ -985 +▁jama -986 +▁kara -987 +▁lase -988 +▁mugu -989 +▁sanu -990 +gnette -991 +▁diinɛ -992 +▁kɛcogo -993 +▁masakɛ -994 +". 
-995 +fu -996 +gɔ -997 +it -998 +ов -999 +dew -1000 +kis -1001 +sis -1002 +sti -1003 +umb -1004 +ɔni -1005 +▁ge -1006 +▁tè -1007 +sion -1008 +tɛrɛ -1009 +▁kala -1010 +▁wati -1011 +orrent -1012 +▁kataa -1013 +▁sudan -1014 +▁woroduguyanfan -1015 +ak -1016 +uk -1017 +▁у -1018 +▁‘ -1019 +ala -1020 +ang -1021 +bur -1022 +ral -1023 +the -1024 +▁ak -1025 +▁el -1026 +ɔnin -1027 +baara -1028 +▁kono -1029 +▁môgô -1030 +tional -1031 +▁arabu -1032 +▁inter -1033 +▁labɛn -1034 +▁surun -1035 +▁ɲuman -1036 +▁kalanso -1037 +▁sirilanw -1038 +▁sɛgɛsɛgɛ -1039 +né -1040 +pp -1041 +ss -1042 +ية -1043 +▁< -1044 +sɛn -1045 +▁qu -1046 +faso -1047 +▁com -1048 +▁shi -1049 +bilen -1050 +ɲɔgɔn -1051 +▁jiri -1052 +▁kore -1053 +▁onye -1054 +▁risi -1055 +▁togo -1056 +▁yoro -1057 +▁dɔnko -1058 +▁hakil -1059 +▁motto -1060 +▁ninnu -1061 +▁silamɛ -1062 +▁faranfasi -1063 +bɛ -1064 +jo -1065 +ld -1066 +fil -1067 +gar -1068 +kon -1069 +ria -1070 +ɔpu -1071 +fina -1072 +jata -1073 +main -1074 +tini -1075 +ɲini -1076 +gharị -1077 +▁dɔrɔn -1078 +▁kulɛri -1079 +▁lakali -1080 +▁ɲinini -1081 +▁dɔnniya -1082 +▁gallery -1083 +▁kumajago -1084 + -15835 +я -15836 +ل -15837 ++ -15838 +ь -15839 +% -15840 +ʃ -15841 +б -15842 +ي -15843 +ā -15844 +ч -15845 +ò -15846 +ة -15847 +* -15848 += -15849 +ц -15850 +ر -15851 +ᴐ -15852 +‘ -15853 +م -15854 +! -15855 +· -15856 +í -15857 +ï -15858 +ї -15859 +â -15860 +х -15861 +ú -15862 +ù -15863 +ы -15864 +ф -15865 +ш -15866 +_ -15867 +ж -15868 +و -15869 +? 
-15870 +ߊ -15871 +ƙ -15872 +ю -15873 +̀ -15874 +á -15875 +ɳ -15876 +ó -15877 +ب -15878 +ɗ -15879 +& -15880 +ü -15881 +є -15882 +ì -15883 +ê -15884 +ج -15885 +ë -15886 +ş -15887 +س -15888 +ع -15889 +ن -15890 +ߞ -15891 +ñ -15892 +ه -15893 +ߏ -15894 +ߒ -15895 +߬ -15896 +ī -15897 +ъ -15898 +э -15899 +ت -15900 +د -15901 +ߋ -15902 +ߘ -15903 +߫ -15904 +߲ -15905 +ı -15906 +œ -15907 +ś -15908 +ū -15909 +ߓ -15910 +° -15911 +İ -15912 +ߌ -15913 +ὲ -15914 +ⴰ -15915 +日 -15916 +î -15917 +ö -15918 +́ -15919 +إ -15920 +ش -15921 +ߍ -15922 +ߎ -15923 +‰ -15924 +{ -15925 +ä -15926 +ø -15927 +щ -15928 +י -15929 +् -15930 +ṇ -15931 +ⵜ -15932 +本 -15933 +# -15934 +ã -15935 +û -15936 +ć -15937 +غ -15938 +ك -15939 +ߐ -15940 +ߙ -15941 +ߝ -15942 +ߡ -15943 +社 -15944 +} -15945 +ł -15946 +ũ -15947 +λ -15948 +ѣ -15949 +ئ -15950 +ز -15951 +ߖ -15952 +ߛ -15953 +ߟ -15954 +ߠ -15955 +ߣ -15956 +ߦ -15957 +ध -15958 +म -15959 +ố -15960 +′ -15961 +『 -15962 +』 -15963 +の -15964 +史 -15965 +朝 -15966 +英 -15967 +集 -15968 +$ -15969 +^ -15970 +£ -15971 +× -15972 +å -15973 +ą -15974 +č -15975 +š -15976 +ʻ -15977 +ˈ -15978 +ː -15979 +δ -15980 +σ -15981 +ה -15982 +ו -15983 +ל -15984 +מ -15985 +ר -15986 +ת -15987 +، -15988 +ح -15989 +ص -15990 +ظ -15991 +ق -15992 +ى -15993 +َ -15994 +ग -15995 diff --git a/models/tokenizer/bm_tokenizer_32k.model b/models/tokenizer/bm_tokenizer_32k.model new file mode 100644 index 0000000000000000000000000000000000000000..356f9d84cd4d01bdd3b05da0b1b81796bf5ccb92 --- /dev/null +++ b/models/tokenizer/bm_tokenizer_32k.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c3728738bd953c0b0980dea17440614b9fc5c1944fd6a606c0819bd83da8f70 +size 801851 diff --git a/models/tokenizer/bm_tokenizer_32k.vocab b/models/tokenizer/bm_tokenizer_32k.vocab new file mode 100644 index 0000000000000000000000000000000000000000..3137a72b1baa7703dfc5fc5965c8aa3766d5d98f --- /dev/null +++ b/models/tokenizer/bm_tokenizer_32k.vocab @@ -0,0 +1,32000 @@ + 0 + 0 + 0 + 0 +▁k -0 +an -1 +▁s -2 +▁b 
-3 +▁d -4 +▁n -5 +▁y -6 +▁m -7 +in -8 +▁f -9 +▁ka -10 +la -11 +ar -12 +▁t -13 +▁ye -14 +am -15 +on -16 +en -17 +▁a -18 +li -19 +▁c -20 +ri -21 +▁j -22 +▁la -23 +ti -24 +ba -25 +le -26 +ɔn -27 +gu -28 +go -29 +ya -30 +ra -31 +▁bɛ -32 +ara -33 +ugu -34 +▁ni -35 +un -36 +▁na -37 +▁w -38 +ana -39 +is -40 +▁min -41 +at -42 +ɔr -43 +ɛn -44 +▁ma -45 +▁o -46 +ma -47 +len -48 +re -49 +ani -50 +ko -51 +ka -52 +▁kɛ -53 +▁si -54 +ɔrɔ -55 +si -56 +lo -57 +▁( -58 +▁sa -59 +▁dugu -60 +ro -61 +▁ko -62 +amana -63 +ɔg -64 +▁san -65 +ga -66 +na -67 +rie -68 +il -69 +tion -70 +ama -71 +▁cat -72 +▁ani -73 +égo -74 +égorie -75 +▁catégorie -76 +ou -77 +▁p -78 +di -79 +▁ba -80 +▁don -81 +ni -82 +▁ta -83 +ul -84 +▁jamana -85 +▁di -86 +gi -87 +ɔgɔ -88 +▁h -89 +▁kan -90 +er -91 +▁ɲ -92 +▁u -93 +▁wa -94 +ɛr -95 +▁e -96 +▁i -97 +so -98 +ta -99 +kan -100 +ran -101 +▁saba -102 +▁se -103 +ɔnɔ -104 +da -105 +ogo -106 +bi -107 +▁de -108 +ki -109 +ur -110 +sa -111 +▁fɛ -112 +▁sabab -113 +ari -114 +lan -115 +▁da -116 +oro -117 +▁ch -118 +▁be -119 +▁fɔ -120 +▁g -121 +▁fa -122 +▁kɔ -123 +▁kɔnɔ -124 +es -125 +▁sababou -126 +▁in -127 +▁dɔ -128 +▁ke -129 +▁tun -130 +▁fran -131 +kɛ -132 +iri -133 +les -134 +ɛrɛ -135 +▁bama -136 +te -137 +us -138 +olo -139 +or -140 +▁is -141 +ire -142 +ille -143 +aman -144 +he -145 +▁sɔrɔ -146 +aran -147 +▁ku -148 +▁ti -149 +fɛ -150 +▁é -151 +niya -152 +ɛb -153 +▁bamako -154 +bara -155 +tions -156 +ais -157 +▁franç -158 +bn -159 +ini -160 +bam -161 +▁français -162 +se -163 +▁dic -164 +▁kelen -165 +▁char -166 +▁isbn -167 +▁ha -168 +um -169 +ditions -170 +▁donniya -171 +▁charles -172 +naire -173 +▁diction -174 +baille -175 +bambara -176 +bailleul -177 +▁éditions -178 +▁dictionnaire -179 +ke -180 +den -181 +eri -182 +nu -183 +aransi -184 +▁taa -185 +▁sigi -186 +▁bɔ -187 +▁an -188 +▁man -189 +▁bi -190 +inɛ -191 +▁ji -192 +fa -193 +lɛ -194 +ɲɛ -195 +▁fan -196 +gɛ -197 +▁af -198 +▁minnu -199 +▁mali -200 +ch -201 +mɛ -202 +). 
-203 +to -204 +de -205 +▁v -206 +▁kɔfɛ -207 +▁sira -208 +ji -209 +wa -210 +▁ja -211 +uru -212 +▁ɲɛ -213 +ulu -214 +▁" -215 +ɔrɔn -216 +lu -217 +▁baara -218 +bɔ -219 +ameri -220 +be -221 +jɛ -222 +▁yo -223 +▁mɔgɔ -224 +▁fara -225 +▁kun -226 +▁dan -227 +▁sen -228 +ye -229 +oli -230 +▁caman -231 +dugu -232 +▁mo -233 +wu -234 +ina -235 +ine -236 +ge -237 +▁fi -238 +▁cɛ -239 +ku -240 +▁mara -241 +ca -242 +yɔrɔ -243 +lɔ -244 +▁tɛ -245 +▁. -246 +man -247 +▁kuma -248 +bo -249 +bu -250 +tu -251 +▁faransi -252 +ce -253 +nen -254 +lima -255 +▁yɔrɔ -256 +▁to -257 +me -258 +qu -259 +▁tu -260 +▁dɔn -261 +ne -262 +don -263 +tigi -264 +ɔgɔn -265 +▁jamanaw -266 +px -267 +▁ɛn -268 +▁tɔgɔ -269 +▁woro -270 +▁su -271 +▁yɛ -272 +pa -273 +lon -274 +ent -275 +▁faso -276 +▁gu -277 +gan -278 +▁ameri -279 +▁ca -280 +▁do -281 +▁mu -282 +▁ya -283 +▁kɛra -284 +▁bɛɛ -285 +ɛnɛ -286 +yalen -287 +), -288 +▁worodugu -289 +ci -290 +cogo -291 +we -292 +▁mi -293 +▁nke -294 +▁ọ -295 +hi -296 +kolo -297 +▁fo -298 +▁afri -299 +▁ga -300 +ha -301 +ɛbɛn -302 +▁jon -303 +jamana -304 +▁walima -305 +do -306 +mu -307 +▁ban -308 +fan -309 +▁tle -310 +nan -311 +▁nin -312 +▁kɔrɔ -313 +▁kɛlɛ -314 +▁yɛrɛ -315 +▁so -316 +ban -317 +▁kalan -318 +heli -319 +▁cogo -320 +▁l -321 +tɛr -322 +uni -323 +▁kos -324 +inɛti -325 +▁fanga -326 +▁saheli -327 +tɛrinɛti -328 +ja -329 +wi -330 +▁dugum -331 +▁ɛntɛrinɛti -332 +▁dɛ -333 +▁re -334 +kili -335 +▁dugumogo -336 +▁yooro -337 +▁bo -338 +▁jɛ -339 +yiri -340 +▁fɔlɔ -341 +kun -342 +▁le -343 +ati -344 +▁r -345 +oni -346 +amara -347 +th -348 +yan -349 +▁ɲɔgɔn -350 +ate -351 +▁fana -352 +▁siti -353 +faransi -354 +du -355 +hụ -356 +st -357 +▁bolo -358 +al -359 +rô -360 +▁kon -361 +bin -362 +ɛbɛ -363 +▁z -364 +▁we -365 +▁kelenyalen -366 +ôrô -367 +▁masa -368 +ilan -369 +▁waati -370 +kọ -371 +▁du -372 +▁bon -373 +▁den -374 +▁fasojamana -375 +kɛla -376 +▁mans -377 +gh -378 +▁ki -379 +▁dam -380 +mi -381 +yi -382 +sen -383 +fi -384 +isi -385 +tin -386 +risi -387 +co -388 +▁sugu -389 +▁wala 
-390 +pu -391 +aba -392 +▁co -393 +▁tile -394 +▁jira -395 +▁tlebi -396 +▁mansamara -397 +kɔ -398 +vi -399 +gwu -400 +ɛgɛ -401 +▁wɛrɛ -402 +fin -403 +mɔgɔ -404 +▁me -405 +▁te -406 +denw -407 +▁afrika -408 +pe -409 +ata -410 +▁al -411 +▁ne -412 +▁amerika -413 +po -414 +dɔn -415 +af -416 +▁kɛmɛ -417 +.[ -418 +gin -419 +kulu -420 +▁kosɛbɛ -421 +ve -422 +ter -423 +▁jɔ -424 +▁jo -425 +▁nka -426 +amanan -427 +▁gun -428 +▁li -429 +▁vi -430 +▁tan -431 +▁jate -432 +que -433 +▁faaba -434 +▁sɛbɛn -435 +▁egwu -436 +▁: -437 +tan -438 +▁ci -439 +▁- -440 +▁diɲɛ -441 +fɔ -442 +pi -443 +▁yen -444 +▁walasa -445 +▁bamanan -446 +zi -447 +▁ar -448 +▁of -449 +▁bɔra -450 +yanfan -451 +kụ -452 +▁kè -453 +▁dɔw -454 +fe -455 +amu -456 +kɔnɔ -457 +▁bila -458 +▁bè -459 +ɛna -460 +urun -461 +▁olu -462 +▁kɔrɔn -463 +▁dugukolo -464 +ing -465 +et -466 +▁ro -467 +▁fɛn -468 +▁kɔn -469 +▁hakɛ -470 +mo -471 +▁no -472 +▁po -473 +dị -474 +gô -475 +kalo -476 +▁son -477 +▁kulu -478 +▁yiri -479 +bụ -480 +cɛ -481 +ft -482 +▁ju -483 +ɛrɛn -484 +ariya -485 +▁yoga -486 +as -487 +▁mar -488 +▁kô -489 +▁ali -490 +▁— -491 +tiki -492 +▁tɔn -493 +▁jago -494 +san -495 +iriki -496 +▁uk -497 +▁daminɛ -498 +▁dô -499 +▁afiriki -500 +▁sin -501 +lle -502 +bli -503 +dala -504 +▁bana -505 +▁sababu -506 +▁“ -507 +kɔn -508 +ɛri -509 +▁fô -510 +wift -511 +▁fil -512 +▁mis -513 +ry -514 +▁ŋ -515 +▁aw -516 +uman -517 +▁swift -518 +▁mari -519 +▁bé -520 +tigɛ -521 +▁kɔgɔ -522 +sh -523 +▁jan -524 +▁fila -525 +▁jɛkulu -526 +ôgô -527 +ariku -528 +▁kura -529 +▁tuma -530 +▁wele -531 +▁con -532 +▁pro -533 +▁poli -534 +▁suguya -535 +▁fe -536 +▁tɔ -537 +▁kɛr -538 +▁boli -539 +su -540 +dan -541 +▁dị -542 +kụkọ -543 +▁the -544 +▁bɛna -545 +▁wɛrɛw -546 +▁kɔgɔji -547 +yo -548 +kaw -549 +wan -550 +▁sis -551 +▁kɛnɛ -552 +▁ukra -553 +au -554 +min -555 +fara -556 +jago -557 +▁bin -558 +▁sôrô -559 +▁ɲɛmɔgɔ -560 +▁ɔ -561 +ene -562 +kɔrɔ -563 +▁ce -564 +▁nɔ -565 +▁on -566 +▁muso -567 +▁sɛnɛ -568 +▁dilan -569 +ll -570 +tt -571 +ɲi -572 +ịhụ -573 +▁fari 
-574 +▁bamanankan -575 +ali -576 +gne -577 +nanya -578 +ịhụnanya -579 +▁bu -580 +▁lo -581 +▁des -582 +▁kab -583 +▁с -584 +▁lam -585 +▁sariya -586 +pụ -587 +▁et -588 +baga -589 +▁fin -590 +▁jɛn -591 +je -592 +▁ụ -593 +our -594 +ron -595 +taa -596 +▁franse -597 +εε -598 +▁[ -599 +▁« -600 +ami -601 +ega -602 +fɛn -603 +▁ho -604 +bolo -605 +▁laban -606 +▁hakili -607 +eni -608 +▁ahụ -609 +▁ndị -610 +amerika -611 +ru -612 +ty -613 +té -614 +dio -615 +sin -616 +▁pa -617 +mali -618 +ropa -619 +▁lab -620 +▁foro -621 +▁yiriwa -622 +▁farafin -623 +law -624 +ver -625 +▁naf -626 +ts -627 +ard -628 +dia -629 +▁fu -630 +▁/ -631 +▁at -632 +▁daɲɛ -633 +.. -634 +ww -635 +ere -636 +nin -637 +▁en -638 +▁go -639 +▁yé -640 +▁tra -641 +▁kama -642 +ɔrɔnya -643 +▁senega -644 +▁– -645 +int -646 +son -647 +▁bụ -648 +▁sh -649 +▁wi -650 +ulon -651 +kɛlaw -652 +kɛrɛn -653 +▁siri -654 +▁tariku -655 +▁baarakɛ -656 +▁+ -657 +sia -658 +▁baw -659 +▁dabɔ -660 +▁marifa -661 +rụ -662 +на -663 +▁, -664 +las -665 +bali -666 +jɛgɛ -667 +yali -668 +▁taama -669 +▁kɛmɛda -670 +▁sigilen -671 +rè -672 +che -673 +kow -674 +dama -675 +lenw -676 +▁kolon -677 +▁mɔgɔw -678 +▁sigira -679 +▁ameriki -680 +▁jamanadenw -681 +▁ɛ -682 +pan -683 +▁lu -684 +▁un -685 +▁duni -686 +▁lajɛ -687 +▁laka -688 +▁sila -689 +èn -690 +ск -691 +ena -692 +▁aka -693 +▁gine -694 +ра -695 +ber -696 +▁es -697 +▁wo -698 +▁dun -699 +▁laa -700 +publi -701 +▁cent -702 +▁tugu -703 +dɔnnen -704 +▁kɛrɛn -705 +▁bamakɔ -706 +▁jɔyɔrɔ -707 +▁politiki -708 +▁в -709 +are -710 +baw -711 +naf -712 +▁dé -713 +▁nt -714 +▁ra -715 +land -716 +tara -717 +▁tali -718 +▁wale -719 +▁cogoya -720 +▁masala -721 +kɛrɛnnen -722 +ré -723 +то -724 +mis -725 +▁je -726 +afri -727 +▁mas -728 +▁mili -729 +▁sisan -730 +el -731 +fo -732 +ps -733 +chi -734 +kar -735 +yɛn -736 +▁kaba -737 +▁minɛ -738 +▁site -739 +▁к -740 +jan -741 +res -742 +ton -743 +▁bar -744 +▁bɛn -745 +▁nafa -746 +▁kɛrɛnkɛrɛnnen -747 +ph -748 +ɛni -749 +hara -750 +▁ihe -751 +arabu -752 +bagan -753 +kalan -754 
+▁kɔkan -755 +▁mansa -756 +▁kabini -757 +ck -758 +baa -759 +bia -760 +mba -761 +tra -762 +▁sun -763 +▁fanba -764 +▁tulon -765 +▁kunnaf -766 +▁farafinna -767 +lé -768 +va -769 +ces -770 +cha -771 +lin -772 +mar -773 +tte -774 +▁ale -775 +▁fla -776 +sɛbɛn -777 +▁sika -778 +ال -779 +tik -780 +ment -781 +tali -782 +▁nan -783 +▁hali -784 +▁tila -785 +afrika -786 +▁eropa -787 +▁laadala -788 +▁ịhụnanya -789 +▁jamanaden -790 +kw -791 +▁hi -792 +▁sɛ -793 +bila -794 +▁abụ -795 +▁mun -796 +▁sou -797 +▁cɛma -798 +▁kalo -799 +▁ukraine -800 +ct -801 +tɛ -802 +ɲa -803 +▁л -804 +▁р -805 +babu -806 +sira -807 +▁kar -808 +▁nana -809 +▁yɛlɛ -810 +▁danbɔ -811 +▁irisi -812 +▁sahara -813 +▁sigida -814 +▁kunnafoni -815 +za -816 +rit -817 +èrè -818 +▁sɛb -819 +ugula -820 +ɛnajɛ -821 +▁wari -822 +▁bonya -823 +▁filmu -824 +tɔ -825 +▁; -826 +▁th -827 +▁sam -828 +▁uni -829 +kelen -830 +kɔrɔn -831 +▁fɔli -832 +▁fɛɛrɛ -833 +▁sɛben -834 +▁hadama -835 +▁danfara -836 +по -837 +▁| -838 +liw -839 +ste -840 +tes -841 +uli -842 +ence -843 +lanw -844 +▁lib -845 +▁kilo -846 +▁kolo -847 +▁tiɲɛ -848 +// -849 +vo -850 +▁ʃ -851 +can -852 +mes -853 +ɛlɛ -854 +▁as -855 +▁pe -856 +dasi -857 +fasi -858 +wari -859 +▁ala -860 +▁mon -861 +▁yan -862 +▁ɲin -863 +▁dɔgɔ -864 +▁jugu -865 +▁minu -866 +▁musa -867 +▁jigin -868 +▁saint -869 +kuntigi -870 +:// -871 +ilɛ -872 +tɔn -873 +bola -874 +gera -875 +▁dala -876 +▁tɛmɛ -877 +▁akụkọ -878 +▁faran -879 +▁senkan -880 +▁farikolo -881 +mb -882 +sɛ -883 +des -884 +han -885 +mah -886 +nes -887 +▁nk -888 +▁pi -889 +ania -890 +▁art -891 +▁bam -892 +▁kul -893 +▁par -894 +▁dɛmɛ -895 +▁sini -896 +▁dunia -897 +▁sɔrɔdasi -898 +no -899 +arị -900 +der -901 +▁ex -902 +▁nu -903 +bili -904 +▁hak -905 +donna -906 +mancɛ -907 +tinin -908 +ɛnama -909 +▁kɛɲɛ -910 +▁seko -911 +▁sera -912 +cation -913 +▁atlan -914 +▁kongo -915 +▁foroba -916 +▁fitinin -917 +dɔ -918 +nô -919 +tle -920 +usu -921 +▁am -922 +▁au -923 +▁er -924 +▁gi -925 +buru -926 +sɛgɛ -927 +▁ama -928 +▁jɔn -929 +▁wee -930 +▁fili 
-931 +▁nɛgɛ -932 +▁sara -933 +▁sɛgɛ -934 +▁bagan -935 +▁kungo -936 +▁segin -937 +▁africa -938 +▁nafolo -939 +▁jamanakuntigi -940 +ен -941 +▁* -942 +▁» -943 +lar -944 +yɔn -945 +ɔra -946 +▁fè -947 +paɲi -948 +▁mus -949 +▁tum -950 +▁bara -951 +▁ɛndu -952 +▁ebola -953 +▁galle -954 +▁kɛnɛya -955 +▁sɔrɔko -956 +▁yɛlɛma -957 +▁cɛmancɛ -958 +▁dɔnkili -959 +▁yɛrɛmah -960 +▁madɔnnen -961 +▁sigiyɔrɔ -962 +ho -963 +aka -964 +ben -965 +ger -966 +gon -967 +mɛn -968 +orr -969 +run -970 +sun -971 +tto -972 +urs -973 +▁bô -974 +▁là -975 +▁sé -976 +▁ال -977 +pụta -978 +were -979 +▁and -980 +▁dum -981 +▁for -982 +▁les -983 +▁por -984 +akụkọ -985 +▁jama -986 +▁kara -987 +▁lase -988 +▁mugu -989 +▁sanu -990 +gnette -991 +▁diinɛ -992 +▁kɛcogo -993 +▁masakɛ -994 +". -995 +fu -996 +gɔ -997 +it -998 +ов -999 +dew -1000 +kis -1001 +sis -1002 +sti -1003 +umb -1004 +ɔni -1005 +▁ge -1006 +▁tè -1007 +sion -1008 +tɛrɛ -1009 +▁kala -1010 +▁wati -1011 +orrent -1012 +▁kataa -1013 +▁sudan -1014 +▁woroduguyanfan -1015 +ak -1016 +uk -1017 +▁у -1018 +▁‘ -1019 +ala -1020 +ang -1021 +bur -1022 +ral -1023 +the -1024 +▁ak -1025 +▁el -1026 +ɔnin -1027 +baara -1028 +▁kono -1029 +▁môgô -1030 +tional -1031 +▁arabu -1032 +▁inter -1033 +▁labɛn -1034 +▁surun -1035 +▁ɲuman -1036 +▁kalanso -1037 +▁sirilanw -1038 +▁sɛgɛsɛgɛ -1039 +né -1040 +pp -1041 +ss -1042 +ية -1043 +▁< -1044 +sɛn -1045 +▁qu -1046 +faso -1047 +▁com -1048 +▁shi -1049 +bilen -1050 +ɲɔgɔn -1051 +▁jiri -1052 +▁kore -1053 +▁onye -1054 +▁risi -1055 +▁togo -1056 +▁yoro -1057 +▁dɔnko -1058 +▁hakil -1059 +▁motto -1060 +▁ninnu -1061 +▁silamɛ -1062 +▁faranfasi -1063 +bɛ -1064 +jo -1065 +ld -1066 +fil -1067 +gar -1068 +kon -1069 +ria -1070 +ɔpu -1071 +fina -1072 +jata -1073 +main -1074 +tini -1075 +ɲini -1076 +gharị -1077 +▁dɔrɔn -1078 +▁kulɛri -1079 +▁lakali -1080 +▁ɲinini -1081 +▁dɔnniya -1082 +▁gallery -1083 +▁kumajago -1084 + -19372 +▁andries -19373 +▁carinna -19374 +▁gassama -19375 +▁jatebɔw -19376 +▁leppard -19377 +▁mapping -19378 +▁quintes -19379 
+▁rapport -19380 +▁sapporo -19381 +▁shikago -19382 +▁ɲɛbilen -19383 +bɛladjɛla -19384 +kɔrɔbilen -19385 +wikiquote -19386 +▁brachysy -19387 +▁comeback -19388 +▁dembella -19389 +▁déposses -19390 +▁jaabilan -19391 +▁koreïchy -19392 +▁korofina -19393 +▁mousolou -19394 +▁trabajos -19395 +▁ɲagalaan -19396 +▁ɲamakoro -19397 +▁ɲwandafa -19398 +▁ɲɛgɛnniw -19399 +ppɔ -19400 +ppɔd -19401 +rald -19402 +sbur -19403 +ural -19404 +ọala -19405 +▁akj -19406 +▁akè -19407 +angha -19408 +angle -19409 +blanc -19410 +burga -19411 +faala -19412 +ppini -19413 +thegu -19414 +theus -19415 +yaala -19416 +▁ella -19417 +▁elvi -19418 +▁ikwa -19419 +▁pese -19420 +amural -19421 +anghai -19422 +appini -19423 +layidu -19424 +ppɔdrɔ -19425 +sburgh -19426 +themba -19427 +thenia -19428 +tinian -19429 +ttoral -19430 +▁akjou -19431 +▁daala -19432 +▁fabur -19433 +▁gothe -19434 +▁viral -19435 +▁ŋɔnin -19436 +metheus -19437 +samadhi -19438 +turisiw -19439 +yabaara -19440 +▁akjouj -19441 +▁bagada -19442 +▁elvira -19443 +▁kokèna -19444 +▁konoti -19445 +▁môgôma -19446 +▁neural -19447 +▁ntọala -19448 +▁sayiji -19449 +▁wulili -19450 +ppɔdrɔme -19451 +ttsburgh -19452 +▁akjoujt -19453 +▁diplome -19454 +▁konotio -19455 +▁leblanc -19456 +▁mafaala -19457 +▁matsayi -19458 +▁minsenw -19459 +▁taniwor -19460 +▁ɲumanba -19461 +angletɛri -19462 +baarakɛla -19463 +▁bagadaji -19464 +▁bagayɔkɔ -19465 +▁gabonais -19466 +▁ikwadori -19467 +▁kpọtụụrụ -19468 +▁littoral -19469 +▁nothemba -19470 +▁shanghai -19471 +▁ŋɔnintan -19472 +▁ɲɛjɔyɔrɔ -19473 +▁ɲɛshinen -19474 +▁автома́т -19475 +▁българия -19476 +▁дальнего -19477 +▁директор -19478 +▁политиче -19479 +▁приговор -19480 +▁разговор -19481 +▁сахалине -19482 +▁художниц -19483 +▁التجانية -19484 +▁ߓߊߘߋ߲ߡߊ߫ -19485 +▁ߓߊ߲ߊߙߊ߲߫ -19486 +▁ߞߊߙߊ߲ߘߋ߲ -19487 +▁ọmụmaatụ -19488 +acquarelli -19489 +agbanyeghị -19490 +alemaɲikan -19491 +angilɛtɛri -19492 +bissaugine -19493 +calcaratus -19494 +cartwright -19495 +centralize -19496 +chologique -19497 +concepcion -19498 +cptailurus -19499 +)". 
-19500 +efu -19501 +ngɔ -19502 +yuk -19503 +▁жи -19504 +akra -19505 +itum -19506 +kisɔ -19507 +lumb -19508 +peak -19509 +tait -19510 +́ngɔ -19511 +▁gem -19512 +▁oak -19513 +▁vak -19514 +▁ɲak -19515 +akari -19516 +eduzi -19517 +kisin -19518 +mouté -19519 +sigiw -19520 +siste -19521 +yukyu -19522 +مملكة -19523 +▁geer -19524 +▁geli -19525 +▁mcco -19526 +▁mogɔ -19527 +▁sɔni -19528 +▁vakf -19529 +bensis -19530 +gandew -19531 +ittait -19532 +itumbu -19533 +jinenw -19534 +kataba -19535 +kisɔde -19536 +lumbus -19537 +ulsion -19538 +▁kongɔ -19539 +▁notho -19540 +▁vakfı -19541 +peaking -19542 +takisin -19543 +المملكة -19544 +▁berlin -19545 +▁chakra -19546 +▁galmés -19547 +▁geertz -19548 +▁kalade -19549 +▁kalaya -19550 +▁kɔ́ngɔ -19551 +▁lasera -19552 +▁malaki -19553 +▁mccoll -19554 +▁ryukyu -19555 +▁samiyɛ -19556 +▁zakari -19557 +▁ɲakata -19558 +▁житель -19559 +dominika -19560 +internet -19561 +itumbuka -19562 +▁assiste -19563 +▁curaçao -19564 +▁ekisɔde -19565 +▁karaben -19566 +▁karabin -19567 +▁lakoron -19568 +▁lankolo -19569 +▁oakland -19570 +▁vakfıke -19571 +▁watijan -19572 +▁windows -19573 +▁ɲasigiw -19574 +catalogue -19575 +▁columbus -19576 +▁djigandé -19577 +▁filɛlanw -19578 +▁kaladeen -19579 +▁portigal -19580 +▁quittait -19581 +▁toumouté -19582 +▁wagandew -19583 +cueilleurs -19584 +dantigɛkan -19585 +devānagarī -19586 +directions -19587 +exposition -19588 +faidherbia -19589 +faransɛkan -19590 +formateurs -19591 +fédération -19592 +gargantuan -19593 +garɛtitigi -19594 +generateur -19595 +gonosticta -19596 +inderianus -19597 +industries -19598 +inpainting -19599 +asho -19600 +bens -19601 +sung -19602 +sunu -19603 +▁sén -19604 +akade -19605 +akash -19606 +benin -19607 +digon -19608 +kolun -19609 +maben -19610 +neurs -19611 +regon -19612 +rogon -19613 +seurs -19614 +teurs -19615 +▁?..) 
-19616 +▁bôle -19617 +▁bôli -19618 +▁oben -19619 +▁ségi -19620 +ashoka -19621 +garand -19622 +kọpụta -19623 +sawara -19624 +sunuya -19625 +tanger -19626 +wepụta -19627 +werela -19628 +▁andro -19629 +▁bôlen -19630 +▁deuil -19631 +▁digon -19632 +▁forge -19633 +▁forti -19634 +▁iklan -19635 +▁jaaka -19636 +▁jamad -19637 +▁jamae -19638 +▁jibow -19639 +▁kwaji -19640 +▁mogon -19641 +▁porti -19642 +▁sagon -19643 +▁sugon -19644 +asseurs -19645 +kolunbu -19646 +ịkọpụta -19647 +▁bokisi -19648 +▁chopin -19649 +▁jamais -19650 +▁lebens -19651 +▁mogony -19652 +▁oregon -19653 +▁songon -19654 +▁urogon -19655 +akademin -19656 +gasawara -19657 +▁balikuw -19658 +▁bàgànin -19659 +▁djɛkulu -19660 +▁ewerela -19661 +▁fortior -19662 +▁jamadɔg -19663 +▁magalɛn -19664 +▁manikaw -19665 +▁mwepụta -19666 +▁obenata -19667 +▁saakash -19668 +▁samsung -19669 +akademinu -19670 +▁bokisiti -19671 +▁christga -19672 +▁fasofaso -19673 +▁jamatigi -19674 +▁jensenen -19675 +▁kojuguba -19676 +▁porteurs -19677 +▁sitiwere -19678 +▁tanneurs -19679 +jelinkusun -19680 +jumhuriyah -19681 +kalansobaw -19682 +kgconduite -19683 +kpochapụwo -19684 +kèlawariyi -19685 +kɔnɔnafili -19686 +lantankɛnɛ -19687 +lanthropus -19688 +latilennan -19689 +leidoscope -19690 +leymanpasa -19691 +liberiakaw -19692 +lɔgɔnɛdiya -19693 +madafɛdugu -19694 +madagaskar -19695 +mammifères -19696 +maninkakan -19697 +marisikalo -19698 +melligerus -19699 +hof -19700 +who -19701 +▁»; -19702 +beho -19703 +larp -19704 +mlar -19705 +omie -19706 +phip -19707 +▁erɔ -19708 +▁fèè -19709 +▁»). 
-19710 +bougo -19711 +liyɔn -19712 +mları -19713 +mtsov -19714 +senho -19715 +speri -19716 +▁auth -19717 +▁erle -19718 +▁erɔp -19719 +▁gici -19720 +▁gila -19721 +▁mɔli -19722 +phippi -19723 +sumaan -19724 +sɛgɛli -19725 +terhof -19726 +waburu -19727 +ımları -19728 +▁amazi -19729 +▁aurit -19730 +▁egoli -19731 +▁erlew -19732 +▁gbeho -19733 +▁joulo -19734 +▁jɔnna -19735 +▁liyɔn -19736 +▁musam -19737 +▁mussa -19738 +asọpụrụ -19739 +sperity -19740 +tımları -19741 +verture -19742 +wanburu -19743 +▁barack -19744 +▁baraji -19745 +▁barali -19746 +▁barazi -19747 +▁chegui -19748 +▁dɔgɔsɔ -19749 +▁dɔkɔni -19750 +▁giciye -19751 +▁guyani -19752 +▁jɔntan -19753 +▁lemuru -19754 +▁madina -19755 +▁nɛgɛye -19756 +▁parado -19757 +▁sanyɔn -19758 +senhoter -19759 +uverture -19760 +òwanburu -19761 +ıtımları -19762 +▁amazigh -19763 +▁auritus -19764 +▁authori -19765 +▁chaleur -19766 +▁distrik -19767 +▁ephippi -19768 +▁furumaw -19769 +▁jouloun -19770 +▁kungolɛ -19771 +▁nemtsov -19772 +▁paradox -19773 +▁princes -19774 +▁sarakaw -19775 +▁seginla -19776 +▁somôgôw -19777 +▁sɔngɔba -19778 +▁touareg -19779 +senhoteru -19780 +▁erlewine -19781 +▁kɛnɛyaso -19782 +▁musamman -19783 +▁nowaburu -19784 +▁nɛgɛyele -19785 +▁peterhof -19786 +▁princess -19787 +▁tɔgɔlama -19788 +▁yɛlɛmalɛ -19789 +▁ɲamanton -19790 +minankalan -19791 +nàfàsɔ̀rɔ̀ -19792 +opoldville -19793 +opérations -19794 +otocobolus -19795 +pdcwaaqbaj -19796 +politiques -19797 +presentati -19798 +profession -19799 +gnô -19800 +arịọ -19801 +derb -19802 +dɔda -19803 +hind -19804 +noma -19805 +noto -19806 +noun -19807 +orno -19808 +shup -19809 +usui -19810 +▁amh -19811 +▁amɔ -19812 +▁nuc -19813 +dimii -19814 +karno -19815 +notoc -19816 +order -19817 +sendɔ -19818 +tlego -19819 +▁amɔs -19820 +▁hakè -19821 +▁kadɔ -19822 +▁kɔge -19823 +▁park -19824 +▁yusu -19825 +▁ɲɛdɔ -19826 +giorno -19827 +mifenw -19828 +▁amami -19829 +▁amman -19830 +▁conno -19831 +▁exter -19832 +▁fusui -19833 +▁justi -19834 +▁litri -19835 +▁sagnô -19836 +▁tnoma -19837 +ggiorno 
-19838 +nounces -19839 +ɛnamaya -19840 +▁amhari -19841 +▁behind -19842 +▁cattle -19843 +▁federb -19844 +▁kuruns -19845 +▁manuce -19846 +▁mashup -19847 +▁ngonin -19848 +▁nkɔnin -19849 +▁ntilen -19850 +▁nucuru -19851 +▁script -19852 +▁siniko -19853 +▁tɔɔrɔw -19854 +▁yusufu -19855 +fication -19856 +location -19857 +ɲɛnamaya -19858 +▁abdimii -19859 +▁amamihe -19860 +▁atlanta -19861 +▁katlego -19862 +▁membres -19863 +▁sukarno -19864 +▁tadonna -19865 +▁wasaden -19866 +jacaranda -19867 +▁bishegin -19868 +▁disorder -19869 +▁dɛmɛmɔgɔ -19870 +▁externes -19871 +▁forobaca -19872 +▁justicia -19873 +▁kaladian -19874 +▁kemifenw -19875 +rocesseurs -19876 +sabikɔnkɔn -19877 +sakramento -19878 +sification -19879 +sylvicapra -19880 +sɛgɛsɛgɛli -19881 +takisininw -19882 +tanishegin -19883 +tashvatara -19884 +tribunnews -19885 +université -19886 +volutional -19887 +walekɛcogo -19888 +wantinsuyu -19889 +wikivoyage -19890 +âmakrishna -19891 +ébullition -19892 +üniversite -19893 +środowiska -19894 +ɔrokɔdonna -19895 +ɲimikɔnkɔn -19896 +рисовавшей -19897 +▁abdoulaye -19898 +▁accipiter -19899 +ssɛ -19900 +ọlụ -19901 +filɛ -19902 +hanp -19903 +nest -19904 +sɛli -19905 +ïdes -19906 +ọọlụ -19907 +▁nkè -19908 +▁nsɛ -19909 +▁tụf -19910 +▁umb -19911 +gerak -19912 +pides -19913 +seleb -19914 +zania -19915 +▁besɛ -19916 +▁dzia -19917 +▁khan -19918 +▁mudr -19919 +▁nisɛ -19920 +▁nsɛg -19921 +▁oumu -19922 +▁pier -19923 +▁piet -19924 +▁pila -19925 +▁semb -19926 +▁yomb -19927 +amides -19928 +coïdes -19929 +hanpur -19930 +kɔɲskɔ -19931 +seania -19932 +yabola -19933 +بنانية -19934 +▁adaba -19935 +▁bamkɔ -19936 +▁bọọlụ -19937 +▁dahla -19938 +▁dania -19939 +▁khanh -19940 +▁kulla -19941 +▁mudrâ -19942 +▁nkene -19943 +▁nkwan -19944 +▁salim -19945 +▁tɛssɛ -19946 +▁vɔlta -19947 +ameless -19948 +berania -19949 +kagerak -19950 +ordinat -19951 +oseania -19952 +ramides -19953 +répides -19954 +▁atlasi -19955 +▁dahlak -19956 +▁ernest -19957 +▁goloma -19958 +▁mafilɛ -19959 +▁nkuman -19960 +▁parent -19961 +▁pietro 
-19962 +▁pilari -19963 +▁semble -19964 +▁sesɛli -19965 +▁shania -19966 +▁tigɛla -19967 +▁tụfuru -19968 +▁umbret -19969 +trépides -19970 +velopper -19971 +▁dalakan -19972 +▁faranfa -19973 +▁iberibe -19974 +▁kalafaw -19975 +▁nkwanye -19976 +▁pierres -19977 +▁tɛmɛlen -19978 +anicoïdes -19979 +atanzania -19980 +▁daminara -19981 +▁memoriam -19982 +▁skagerak -19983 +▁tasumaka -19984 +▁umbretta -19985 +norwijikan -19986 +▁accueille -19987 +▁activiste -19988 +▁adamadéya -19989 +▁aksiyɔmuw -19990 +▁akọwapụta -19991 +▁aleksandr -19992 +▁alimentée -19993 +▁amanirena -19994 +▁americain -19995 +▁amnirense -19996 +▁améthyste -19997 +▁anciennes -19998 +▁angulaire -19999 +ovo -20000 +vod -20001 +bɛlɛ -20002 +kovo -20003 +scan -20004 +tivo -20005 +wɛlɛ -20006 +▁ʃan -20007 +▁ʃɔn -20008 +armes -20009 +budat -20010 +dogon -20011 +messo -20012 +nuovo -20013 +owari -20014 +ɛlɛkɛ -20015 +▁asar -20016 +▁asco -20017 +▁assa -20018 +▁favo -20019 +▁peas -20020 +▁peer -20021 +▁peli -20022 +▁peti -20023 +▁peyi -20024 +▁play -20025 +▁taxi -20026 +▁ʃyan -20027 +biwɛlɛ -20028 +fasili -20029 +mismes -20030 +tɔnnan -20031 +▁andre -20032 +▁araba -20033 +▁ascof -20034 +▁dɔnia -20035 +▁ganta -20036 +▁indiz -20037 +▁jerry -20038 +▁monas -20039 +▁mongo -20040 +▁monko -20041 +▁monte -20042 +▁monti -20043 +▁natal -20044 +▁yanki -20045 +▁zavod -20046 +▁ɲinan -20047 +▁alamar -20048 +▁asarki -20049 +▁assala -20050 +▁ebudat -20051 +▁filipe -20052 +▁fɔlisɛ -20053 +▁kilɛma -20054 +▁koloko -20055 +▁kolose -20056 +▁kolosi -20057 +▁mɛlɛkɛ -20058 +▁nativo -20059 +▁ntɛlɛn -20060 +▁peyiba -20061 +▁tenisi -20062 +▁toscan -20063 +▁ɲininɛ -20064 +▁babiliw -20065 +▁gantayi -20066 +▁juguman -20067 +▁kolokow -20068 +▁montico -20069 +▁peliaba -20070 +▁petites -20071 +▁players -20072 +▁yɛlenni -20073 +▁местный -20074 +▁ценника -20075 +guistique -20076 +▁ascofaré -20077 +▁assalamu -20078 +▁capitale -20079 +▁conowari -20080 +▁favorite -20081 +▁kolokowo -20082 +▁kololenw -20083 +▁mongolia -20084 +▁nabiwɛlɛ -20085 +▁permesso 
-20086 +▁seginnen -20087 +▁viktoria -20088 +▁ценниках -20089 +▁animismes -20090 +▁annectens -20091 +▁announces -20092 +▁antropolo -20093 +▁apatrides -20094 +▁aphorisme -20095 +▁aprilkalo -20096 +▁arajokuma -20097 +▁archuleta -20098 +▁ascetices -20099 +vins -20100 +ɲuli -20101 +sites -20102 +tɔɔrɔ -20103 +▁liby -20104 +▁rayu -20105 +▁rupi -20106 +▁samp -20107 +▁that -20108 +▁then -20109 +enidae -20110 +jalanw -20111 +kamalé -20112 +kɛmɛda -20113 +muɲuli -20114 +▁arius -20115 +▁malok -20116 +▁mites -20117 +▁nyema -20118 +▁reste -20119 +▁samar -20120 +▁sites -20121 +▁taste -20122 +▁thres -20123 +▁unice -20124 +▁unita -20125 +▁vites -20126 +kelenan -20127 +kɔrɔnfɛ -20128 +▁bovins -20129 +▁fɔlifɔ -20130 +▁jalanw -20131 +▁keynes -20132 +▁kuntaw -20133 +▁labenw -20134 +▁liberi -20135 +▁lukash -20136 +▁rayuwa -20137 +▁samene -20138 +▁samogo -20139 +▁sɛbeni -20140 +▁thiago -20141 +▁unicef -20142 +holstein -20143 +▁cɛkelen -20144 +▁etipoia -20145 +▁jikɔrɔn -20146 +▁kamèlen -20147 +▁lakaliw -20148 +▁lakelen -20149 +▁niɛnajɛ -20150 +▁ogologo -20151 +▁sampana -20152 +▁surtout -20153 +▁terrain -20154 +▁threski -20155 +▁vitesse -20156 +▁waridon -20157 +▁bajalanw -20158 +▁bankelen -20159 +▁ginshiƙi -20160 +▁jikɔrɔni -20161 +▁jiralanw -20162 +▁kankelen -20163 +▁malokini -20164 +▁threskio -20165 +kamalénnin -20166 +▁assaudiya -20167 +▁asturiano -20168 +▁auerstadt -20169 +▁aurobindo -20170 +▁authority -20171 +▁auxiliary -20172 +▁azerbijan -20173 +▁badoulaye -20174 +▁bafoulabe -20175 +▁bajangara -20176 +▁bakɔnɔnin -20177 +▁baltimore -20178 +▁banbaciya -20179 +▁banbannen -20180 +▁banjagara -20181 +▁barokunba -20182 +▁benedicta -20183 +▁bharatiya -20184 +▁biarmicus -20185 +▁bibliothè -20186 +▁bikononto -20187 +▁bilankoro -20188 +▁birililen -20189 +▁birintufa -20190 +▁bolininjɛ -20191 +▁bolobɔlan -20192 +▁bolokinin -20193 +▁boubacari -20194 +▁boudhisme -20195 +▁bourgneuf -20196 +▁breweries -20197 +▁brillants -20198 +▁bucaraman -20199 +aɲa -20200 +ịza -20201 +▁рс -20202 +adun -20203 +fact 
-20204 +gypt -20205 +ople -20206 +yèrè -20207 +▁act -20208 +▁ngɔ -20209 +▁рсф -20210 +neros -20211 +otuto -20212 +ritmɛ -20213 +ritɔn -20214 +ɛrɛtɛ -20215 +▁jeɲa -20216 +▁kart -20217 +▁sɛmɛ -20218 +▁tièw -20219 +▁ŋaɲa -20220 +▁ƙira -20221 +▁рсфс -20222 +anemia -20223 +douyon -20224 +fɛrɛtɛ -20225 +people -20226 +tanism -20227 +xvième -20228 +▁commi -20229 +▁egypt -20230 +▁geode -20231 +▁karkh -20232 +▁karya -20233 +▁mmezu -20234 +▁mungo -20235 +▁munum -20236 +▁nanai -20237 +▁nanda -20238 +▁nanga -20239 +▁nanni -20240 +▁phone -20241 +▁pobla -20242 +▁souko -20243 +▁soumo -20244 +▁рсфср -20245 +kolonci -20246 +tanisms -20247 +▁banaɲa -20248 +▁cheikh -20249 +▁cɛmala -20250 +▁dibila -20251 +▁duniɲa -20252 +▁josira -20253 +▁kasira -20254 +▁nanfan -20255 +▁nanina -20256 +▁sibila -20257 +▁sisili -20258 +▁sutraw -20259 +▁yɛlɛko -20260 +cisneros -20261 +fɛrɛtɛda -20262 +▁demisew -20263 +▁formisi -20264 +▁geodets -20265 +▁karitɔn -20266 +▁kartver -20267 +▁korekaw -20268 +▁munumun -20269 +▁nankɔrɔ -20270 +▁okpukpu -20271 +▁origina -20272 +▁shengin -20273 +▁sigidaw -20274 +▁sɛgɛnna -20275 +▁taasira -20276 +▁yɛlɛman -20277 +▁banamini -20278 +▁committe -20279 +▁dijitalụ -20280 +▁karkhdon -20281 +▁original -20282 +lopardalis -20283 +▁algoritmɛ -20284 +▁bamanakan -20285 +▁bulenmuso -20286 +▁burtaniya -20287 +▁burukisɛw -20288 +▁buturunin -20289 +▁byzantine -20290 +▁bɔbɔnkari -20291 +▁bɔlɔnkɔnɔ -20292 +▁bɔɳɔgɔnma -20293 +▁camasoron -20294 +▁cantonale -20295 +▁carbonell -20296 +▁categoría -20297 +▁centropus -20298 +▁centurion -20299 +ìlé -20300 +الة -20301 +bmar -20302 +cces -20303 +chaa -20304 +chak -20305 +jɛlé -20306 +léla -20307 +tìlé -20308 +èlin -20309 +دالة -20310 +ụcha -20311 +dalin -20312 +linus -20313 +natal -20314 +talie -20315 +yocha -20316 +عدالة -20317 +▁alew -20318 +▁boom -20319 +▁bret -20320 +▁viva -20321 +▁walé -20322 +jɛléfɛ -20323 +marine -20324 +ribmar -20325 +tances -20326 +▁alete -20327 +▁flash -20328 +▁icton -20329 +▁lutte -20330 +▁mieux -20331 +▁remar -20332 
+▁sugar -20333 +▁sunsu -20334 +▁عدالة -20335 +chakras -20336 +enyocha -20337 +finance -20338 +kamerun -20339 +éléyama -20340 +▁donniw -20341 +▁guèlin -20342 +▁kobako -20343 +▁ladɔgɔ -20344 +▁libana -20345 +▁mechaa -20346 +▁ntụnye -20347 +▁succes -20348 +▁traces -20349 +▁téléla -20350 +▁worces -20351 +▁ɲɛmaaw -20352 +biisinka -20353 +ghribmar -20354 +restiers -20355 +▁aleteia -20356 +▁fanbaye -20357 +▁ictonyx -20358 +▁interno -20359 +▁kolombi -20360 +▁makanta -20361 +▁natalie -20362 +▁ndebele -20363 +▁ngwụcha -20364 +▁sugufew -20365 +▁sunsuun -20366 +▁الجزائر -20367 +telegraph -20368 +▁bretania -20369 +▁burdamew -20370 +▁dandalin -20371 +▁hematite -20372 +▁njegharị -20373 +meghribmar -20374 +▁anastomus -20375 +▁cervantes -20376 +▁champione -20377 +▁chantiers -20378 +▁chasseurs -20379 +▁chiappini -20380 +▁chloropus -20381 +▁chongqing -20382 +▁chouinard -20383 +▁chrechien -20384 +▁christgau -20385 +▁christian -20386 +▁cleansing -20387 +▁cleveland -20388 +▁coloniale -20389 +▁committee -20390 +▁community -20391 +▁compagnie -20392 +▁concludes -20393 +▁congolais -20394 +▁continent -20395 +▁corollary -20396 +▁cumhuriye -20397 +▁cèlasiraw -20398 +▁cɛnsennen -20399 +mph -20400 +phs -20401 +uck -20402 +cɛni -20403 +lock -20404 +luck -20405 +phre -20406 +traw -20407 +tuck -20408 +zick -20409 +ɛnia -20410 +▁ved -20411 +artra -20412 +bomba -20413 +kinpe -20414 +mphis -20415 +phrey -20416 +phron -20417 +trace -20418 +tucky -20419 +ɔlɔkɔ -20420 +▁hack -20421 +amibia -20422 +litube -20423 +nkalan -20424 +ptrace -20425 +pusion -20426 +traire -20427 +trales -20428 +▁atɛni -20429 +▁comba -20430 +▁dibaa -20431 +▁fomba -20432 +▁karmā -20433 +▁katra -20434 +▁lutra -20435 +▁nabaa -20436 +▁straw -20437 +▁tiɛni -20438 +bnaniya -20439 +ìnkalan -20440 +▁cullin -20441 +▁dogoni -20442 +▁kabori -20443 +▁karmāṇ -20444 +▁rendez -20445 +▁sunkun -20446 +▁unlock -20447 +▁vozick -20448 +▁zanuck -20449 +artradio -20450 +bnaniyah -20451 +kentucky -20452 +kiptrace -20453 +rupusion -20454 +▁combatt -20455 
+▁dabɔbaa -20456 +▁karmāṇi -20457 +▁mansake -20458 +▁marabaa -20459 +▁memphis -20460 +▁misɛnia -20461 +▁siribaa -20462 +▁vedānta -20463 +▁wikinpe -20464 +adịchaghị -20465 +dɔnbaliya -20466 +kalancogo -20467 +▁biennial -20468 +▁cullinan -20469 +▁dɛmɛcɛni -20470 +▁goodluck -20471 +▁hamphrey -20472 +▁jateminè -20473 +▁kalanbaa -20474 +▁kankalan -20475 +▁kolonbia -20476 +▁laborato -20477 +▁neophron -20478 +▁sereyara -20479 +▁strawber -20480 +lubnaniyah -20481 +▁amplitube -20482 +▁chanteuse -20483 +▁combattre -20484 +▁contraire -20485 +▁dabakalas -20486 +▁dafalenya -20487 +▁dagifalle -20488 +▁dakabanan -20489 +▁dalajɛlen -20490 +▁damanamaw -20491 +▁danfarako -20492 +▁dansigili -20493 +▁datugulen -20494 +▁decipiens -20495 +▁degeneres -20496 +▁dementiev -20497 +▁derbianus -20498 +▁desanburu -20499 +ߌ߬ -20500 +llɛ -20501 +ojɛ -20502 +phé -20503 +ߘߌ߬ -20504 +diɲɛ -20505 +dton -20506 +nton -20507 +phan -20508 +endha -20509 +libya -20510 +lissa -20511 +lɛden -20512 +phéni -20513 +resun -20514 +sadhu -20515 +tsiya -20516 +tures -20517 +useni -20518 +▁balɛ -20519 +▁barr -20520 +▁gres -20521 +▁kano -20522 +▁topi -20523 +cidenw -20524 +diyasi -20525 +endhal -20526 +janman -20527 +katali -20528 +mentao -20529 +ntonso -20530 +resund -20531 +tonnan -20532 +▁barbe -20533 +▁barca -20534 +▁blues -20535 +▁bɛnkɛ -20536 +▁bɛnna -20537 +▁dambɛ -20538 +▁fanta -20539 +▁mikhe -20540 +▁minɛw -20541 +▁topic -20542 +emetụta -20543 +phénixi -20544 +sanburg -20545 +êafrîka -20546 +▁ancien -20547 +▁balɛmɛ -20548 +▁barber -20549 +▁bluesz -20550 +▁bɛnnen -20551 +▁fɛrɛtɛ -20552 +▁huseni -20553 +▁kabaya -20554 +▁kɔrojɛ -20555 +▁lakela -20556 +▁manton -20557 +▁sulawe -20558 +▁wlissa -20559 +▁ɲikali -20560 +cultures -20561 +ksanburg -20562 +tonnante -20563 +▁barbeau -20564 +▁barrama -20565 +▁blondel -20566 +▁centres -20567 +▁edgeler -20568 +▁fantaya -20569 +▁formula -20570 +▁mantonw -20571 +▁mikheil -20572 +▁oresund -20573 +▁petroli -20574 +▁sandton -20575 +▁tigrina -20576 +janmanjan -20577 +▁abdiyasi 
-20578 +▁bêafrîka -20579 +▁dugubala -20580 +▁kamarike -20581 +▁lakelali -20582 +▁luscinia -20583 +▁stendhal -20584 +▁sulawesi -20585 +▁tementao -20586 +▁barberini -20587 +▁diinɛkulu -20588 +▁dimansila -20589 +▁dingiraye -20590 +▁diocèseba -20591 +▁distances -20592 +▁distincte -20593 +▁diyarbakı -20594 +▁diɔyɔrɔta -20595 +▁diɛtɛminɛ -20596 +▁dlanfenba -20597 +▁dogofeere -20598 +▁dolatanla -20599 +fali -20600 +gɛlɛ -20601 +nord -20602 +▁ano -20603 +▁suè -20604 +▁zai -20605 +drape -20606 +henri -20607 +linga -20608 +ātman -20609 +▁ginɛ -20610 +▁kɔfe -20611 +▁mang -20612 +▁mank -20613 +▁mukɔ -20614 +▁pinɛ -20615 +▁sefa -20616 +eriani -20617 +gɛlɛya -20618 +isance -20619 +koroba -20620 +pinnis -20621 +ɔgɔncɛ -20622 +▁anoon -20623 +▁cukan -20624 +▁suède -20625 +▁taase -20626 +▁tille -20627 +▁unida -20628 +diocèse -20629 +drapeau -20630 +erianij -20631 +uruyala -20632 +▁adịghị -20633 +▁donkan -20634 +▁ikwesị -20635 +▁inaugu -20636 +▁jenevu -20637 +▁kyauta -20638 +▁latimɛ -20639 +▁nasira -20640 +▁seriya -20641 +▁tômôen -20642 +soomaali -20643 +vipinnis -20644 +▁boccoli -20645 +▁dayelen -20646 +▁haïdara -20647 +▁kunbena -20648 +▁mangɔrɔ -20649 +▁mukɔson -20650 +▁nienini -20651 +▁nubikaw -20652 +▁nyɔgɔna -20653 +▁tillebi -20654 +▁unidade -20655 +▁ɳɔgɔncɛ -20656 +gɛlɛyakow -20657 +▁budgetti -20658 +▁cekoroba -20659 +▁filimuko -20660 +▁houphouë -20661 +▁jiralikɛ -20662 +▁nuakshot -20663 +▁nyɛnyini -20664 +▁sekufali -20665 +lasuruyala -20666 +soomaaliya -20667 +▁dolokalan -20668 +▁dominique -20669 +▁donkilida -20670 +▁douminiko -20671 +▁dumetorum -20672 +▁dumunifèn -20673 +▁edgewater -20674 +▁editorial -20675 +▁efficaces -20676 +▁ekwesịghị -20677 +▁elizabeth -20678 +▁ensembles -20679 +▁episcopus -20680 +▁esperanto -20681 +▁eutropius -20682 +▁executive -20683 +▁explorant -20684 +▁falenfɛnw -20685 +▁famgadɔda -20686 +▁famuyalen -20687 +▁fantanani -20688 +▁faraniɔgɔ -20689 +▁faraɳɔkan -20690 +▁fariyakow -20691 +▁fasciatus -20692 +▁fascinant -20693 +▁fasodenya -20694 +▁fasojɔlaw 
-20695 +▁fatoumata -20696 +▁favorable -20697 +▁federasɔn -20698 +▁fertilité -20699 +igi -20700 +set -20701 +êse -20702 +ọkọ -20703 +anci -20704 +keli -20705 +sêse -20706 +yọkọ -20707 +zulu -20708 +▁"), -20709 +▁ake -20710 +▁jir -20711 +▁rnb -20712 +▁twi -20713 +▁von -20714 +anium -20715 +gnènè -20716 +irifi -20717 +kiden -20718 +tiden -20719 +▁asic -20720 +▁coup -20721 +▁fosi -20722 +▁haer -20723 +▁hake -20724 +▁numé -20725 +▁oden -20726 +▁rebe -20727 +▁seke -20728 +▁wase -20729 +▁ɛkun -20730 +denkan -20731 +tidens -20732 +yanoga -20733 +▁baden -20734 +▁diden -20735 +▁donga -20736 +▁lomek -20737 +▁luigi -20738 +▁minne -20739 +▁penti -20740 +▁urdun -20741 +▁ụyọkọ -20742 +ancient -20743 +sankeli -20744 +▁binnen -20745 +▁dongah -20746 +▁firifi -20747 +▁haerin -20748 +▁korero -20749 +▁kɛlɛla -20750 +▁minnea -20751 +▁musset -20752 +▁nantou -20753 +▁numéro -20754 +▁odense -20755 +▁sanuma -20756 +▁sigila -20757 +▁sitewe -20758 +▁tectus -20759 +dörösêse -20760 +madenkan -20761 +urmanssé -20762 +▁bubacar -20763 +▁cyanoga -20764 +▁dechara -20765 +▁isizulu -20766 +▁kurunbo -20767 +▁luganda -20768 +▁magnènè -20769 +▁miliyar -20770 +▁rebelle -20771 +▁sekeret -20772 +▁uranium -20773 +▁waseden -20774 +dsddfgghh -20775 +thridates -20776 +ödörösêse -20777 +▁bebaliso -20778 +▁ibikorwa -20779 +▁kɛlɛmasa -20780 +▁massives -20781 +▁nantoumé -20782 +▁sitewebi -20783 +▁towalima -20784 +bulgarikan -20785 +dsddfgghhv -20786 +gabailleul -20787 +rabailleul -20788 +▁acutidens -20789 +▁afrikiden -20790 +▁décennies -20791 +▁filipekaw -20792 +▁filipinas -20793 +▁filozofiw -20794 +▁firifirin -20795 +▁fitinigun -20796 +▁fitowarta -20797 +▁flashback -20798 +▁fluvglant -20799 +khe -20800 +otú -20801 +inik -20802 +lype -20803 +maël -20804 +qzân -20805 +seli -20806 +sout -20807 +▁ase -20808 +▁hyt -20809 +▁khe -20810 +▁tii -20811 +▁tix -20812 +▁ɲɛb -20813 +attle -20814 +jimaw -20815 +kheta -20816 +kibar -20817 +linik -20818 +mantu -20819 +ɛrɛla -20820 +▁hɔrɔ -20821 +▁kheo -20822 +▁lost -20823 +▁mika 
-20824 +▁nanɛ -20825 +▁palm -20826 +▁tiki -20827 +arinia -20828 +inikan -20829 +nkuman -20830 +tuareg -20831 +yaqzân -20832 +▁clype -20833 +▁fille -20834 +▁kuoro -20835 +▁leone -20836 +▁mansi -20837 +▁tiimɛ -20838 +▁wille -20839 +▁yaran -20840 +▁будет -20841 +ireille -20842 +tskheta -20843 +▁aubert -20844 +▁diyawo -20845 +▁halibi -20846 +▁hɔrɔɔn -20847 +▁ismaël -20848 +▁kheops -20849 +▁kinyan -20850 +▁klinik -20851 +▁mikael -20852 +▁ostria -20853 +▁relief -20854 +▁willem -20855 +bakrunba -20856 +ctarinia -20857 +milliard -20858 +pɛrɛpɛrɛ -20859 +▁alimami -20860 +▁alkibar -20861 +▁donsokè -20862 +▁gbɛrɛla -20863 +▁kerefen -20864 +▁niɔgɔna -20865 +▁nouveau -20866 +▁schools -20867 +▁seattle -20868 +▁yaranan -20869 +▁batiseli -20870 +▁cencenma -20871 +▁clypeata -20872 +▁kunmantu -20873 +▁mireille -20874 +▁mtskheta -20875 +ukrainikan -20876 +▁formisida -20877 +▁forokonin -20878 +▁francesan -20879 +▁francesca -20880 +▁franchise -20881 +▁francisco -20882 +▁frankfurt -20883 +▁furusiriw -20884 +▁fɛɛrɛyɛrɛ -20885 +▁gafekalan -20886 +▁galasikaw -20887 +▁gambiagam -20888 +▁ganamugan -20889 +▁geodetski -20890 +▁gigahertz -20891 +▁gnôgôfaga -20892 +▁gotenburg -20893 +▁granadine -20894 +▁grosvenor -20895 +▁guatemala -20896 +▁gudanarwa -20897 +▁gwakọtara -20898 +▁gwatemala -20899 +aɗ -20900 +ߛߎ -20901 +),[ -20902 +rte -20903 +tex -20904 +øse -20905 +œur -20906 +ɗaɗ -20907 +ߛߎ߲ -20908 +"),[ -20909 +aire -20910 +cœur -20911 +ents -20912 +line -20913 +lius -20914 +nake -20915 +olow -20916 +rous -20917 +teti -20918 +user -20919 +vous -20920 +▁ate -20921 +crans -20922 +daire -20923 +girte -20924 +heart -20925 +mains -20926 +ranus -20927 +snake -20928 +ɗaɗen -20929 +▁apra -20930 +▁deen -20931 +▁kaca -20932 +▁labo -20933 +▁late -20934 +▁list -20935 +▁root -20936 +cranus -20937 +gerous -20938 +leonés -20939 +nuaire -20940 +▁chore -20941 +▁cinta -20942 +▁ertso -20943 +▁nkaro -20944 +▁nkili -20945 +▁nwara -20946 +▁sampi -20947 +▁touma -20948 +▁verne -20949 +ingbing -20950 +pyright -20951 
+romagna -20952 +▁agents -20953 +▁bamaan -20954 +▁dentex -20955 +▁doolow -20956 +▁marisi -20957 +▁mmehie -20958 +▁online -20959 +▁écrans -20960 +▁ߛߓߍߛߎ߲ -20961 +rocranus -20962 +yangirte -20963 +▁abdulay -20964 +▁damadɔn -20965 +▁kuɗaɗen -20966 +▁lamunun -20967 +▁ntuguun -20968 +▁perelli -20969 +▁sanjiko -20970 +▁souvent -20971 +▁annuaire -20972 +▁bamanakɔ -20973 +▁barilius -20974 +▁bingbing -20975 +▁courteti -20976 +▁digitata -20977 +▁facerías -20978 +▁latigɛra -20979 +▁syndrome -20980 +▁ɲɛnayeli -20981 +▁больнице -20982 +pyrocranus -20983 +▁copyright -20984 +▁cɛsiribaa -20985 +▁damadɔnin -20986 +▁dangerous -20987 +▁diafounou -20988 +▁dyangirte -20989 +▁gɛlɛyabaw -20990 +▁haminanko -20991 +▁hasselbla -20992 +▁hawthrone -20993 +▁hierarchy -20994 +▁hollywood -20995 +▁houphouët -20996 +▁hyaenidae -20997 +▁hyperarid -20998 +▁hɔrɔnyara -20999 +wk -21000 +dzi -21001 +esb -21002 +oye -21003 +èce -21004 +enea -21005 +esar -21006 +foto -21007 +gife -21008 +pèce -21009 +sime -21010 +ulée -21011 +ɲɛɲɛ -21012 +▁arj -21013 +▁dɔc -21014 +▁faw -21015 +▁faç -21016 +▁jwk -21017 +▁mpi -21018 +dziko -21019 +esbva -21020 +henea -21021 +inafo -21022 +inini -21023 +vidio -21024 +ésime -21025 +▁aiki -21026 +▁bekɛ -21027 +▁chad -21028 +▁cust -21029 +▁dakɛ -21030 +▁godd -21031 +▁jɛma -21032 +▁kɔda -21033 +▁litu -21034 +▁shpa -21035 +▁tuns -21036 +▁wood -21037 +espèce -21038 +gifera -21039 +minɛli -21040 +▁arjen -21041 +▁denko -21042 +▁façon -21043 +▁gizon -21044 +▁goddy -21045 +▁madga -21046 +▁unico -21047 +▁vibhū -21048 +▁yorow -21049 +onésime -21050 +▁caesar -21051 +▁dakɛɲɛ -21052 +▁dònìni -21053 +▁falaje -21054 +▁franko -21055 +▁ghenea -21056 +▁kadara -21057 +▁karibi -21058 +▁kirina -21059 +▁renale -21060 +▁senoye -21061 +▁sonono -21062 +▁unicod -21063 +▁custard -21064 +▁dɔcland -21065 +▁kalancɛ -21066 +▁nciniin -21067 +▁shpagin -21068 +▁vibhūti -21069 +branchius -21070 +mangifera -21071 +▁capacité -21072 +▁fariɲɛɲɛ -21073 +▁façonnan -21074 +▁formulée -21075 +▁hanyoyin -21076 
+▁lituania -21077 +▁marakɛla -21078 +▁nɔminɛli -21079 +▁tunkurun -21080 +jmniejszym -21081 +lobailleul -21082 +▁arjentiki -21083 +▁cinquantɛ -21084 +▁façonnant -21085 +▁ichneumia -21086 +▁ikhamanga -21087 +▁imiragenw -21088 +▁incarnent -21089 +▁incolorep -21090 +▁indigénat -21091 +▁influence -21092 +▁ispanikan -21093 +▁jacaranda -21094 +▁jagoranta -21095 +▁jamadɔgon -21096 +▁jamandenw -21097 +▁jeliwtigi -21098 +▁jibɔyɔrɔw -21099 +▁، -21100 +als -21101 +ear -21102 +uan -21103 +âté -21104 +boro -21105 +dita -21106 +duit -21107 +fula -21108 +kono -21109 +▁bep -21110 +▁bey -21111 +▁beè -21112 +▁dag -21113 +▁dao -21114 +▁ses -21115 +▁ubi -21116 +▁ịme -21117 +atlan -21118 +dière -21119 +early -21120 +enici -21121 +tilan -21122 +ɛnina -21123 +▁fadi -21124 +▁fati -21125 +▁kado -21126 +▁sean -21127 +▁tuni -21128 +fulala -21129 +lanani -21130 +sodiya -21131 +tenici -21132 +ungary -21133 +▁amour -21134 +▁espan -21135 +▁faara -21136 +▁fyɛba -21137 +▁goals -21138 +▁landa -21139 +▁ninni -21140 +▁samfu -21141 +▁tangi -21142 +▁thuan -21143 +produit -21144 +sebesun -21145 +tilance -21146 +иловика -21147 +▁barisa -21148 +▁fatima -21149 +▁foloon -21150 +▁temala -21151 +verdière -21152 +иловикам -21153 +▁diɛnina -21154 +▁fadiara -21155 +▁gnanajɛ -21156 +▁gouraud -21157 +▁hampâté -21158 +▁hungary -21159 +▁iziniba -21160 +▁nickelo -21161 +▁sɛbɛnan -21162 +▁tangili -21163 +▁tlanani -21164 +▁tuniɛna -21165 +▁ɲadɔnna -21166 +▁ịmepụta -21167 +atlantiki -21168 +kosebesun -21169 +▁afrodita -21170 +▁espankan -21171 +▁futenici -21172 +▁fyɛbaden -21173 +▁nisodiya -21174 +▁quarante -21175 +▁samfuran -21176 +▁sorbonne -21177 +▁крылатой -21178 +dɔkɔtɔrɔya -21179 +▁dilannenw -21180 +▁guangdong -21181 +▁jadilanna -21182 +▁jigiyɔrɔw -21183 +▁jiriforow -21184 +▁joséphine -21185 +▁jurudonna -21186 +▁justinian -21187 +▁jutugunin -21188 +▁juwinkalo -21189 +▁jɔyɔrɔbla -21190 +▁jɛgɛncogo -21191 +▁jɛkafanga -21192 +▁kabarasso -21193 +▁kafobolon -21194 +▁kaladinba -21195 +▁kalansira -21196 +▁kalansoba -21197 
+▁kalanyoro -21198 +▁kamalenni -21199 +dā -21200 +dān -21201 +nha -21202 +uki -21203 +рин -21204 +▁wé -21205 +boda -21206 +dɔni -21207 +inki -21208 +isse -21209 +kita -21210 +niki -21211 +orsa -21212 +saka -21213 +ūdān -21214 +рины -21215 +▁deg -21216 +▁mur -21217 +▁psy -21218 +▁yun -21219 +amiyɛ -21220 +dorsa -21221 +fetti -21222 +kniki -21223 +rieur -21224 +sūdān -21225 +▁aire -21226 +▁bɔna -21227 +▁dari -21228 +▁donn -21229 +▁fòlò -21230 +▁gabu -21231 +▁hôte -21232 +▁jeun -21233 +▁nasa -21234 +▁push -21235 +▁sìra -21236 +▁tili -21237 +▁tlas -21238 +▁wéle -21239 +matɛri -21240 +samiyɛ -21241 +▁aires -21242 +▁filla -21243 +▁jones -21244 +▁murdo -21245 +▁sanou -21246 +▁seung -21247 +▁zanbe -21248 +▁ирины -21249 +entinki -21250 +mansakɛ -21251 +tekniki -21252 +térieur -21253 +▁badara -21254 +▁cycles -21255 +▁darien -21256 +▁hôteli -21257 +▁jeunes -21258 +▁lusaka -21259 +▁nyaman -21260 +▁suisse -21261 +▁verden -21262 +▁ƙunshi -21263 +▁ɲashin -21264 +dorsalis -21265 +niafunké -21266 +unjougou -21267 +▁donnina -21268 +▁kurunba -21269 +▁makadji -21270 +▁masauki -21271 +▁murdoch -21272 +▁samasen -21273 +▁segintɔ -21274 +▁zanbezi -21275 +▁ịsọpụrụ -21276 +▁boilivia -21277 +▁confetti -21278 +▁dogonoka -21279 +▁jentinki -21280 +▁soomaali -21281 +▁degtyarev -21282 +▁fangaboda -21283 +▁hôtelière -21284 +▁intérieur -21285 +▁izdavačko -21286 +▁kamankunw -21287 +▁kamissoko -21288 +▁karamɔgɔw -21289 +▁kasankeli -21290 +▁kasuwanci -21291 +▁kawantili -21292 +▁kerkilila -21293 +▁khassonké -21294 +▁kidemokra -21295 +▁kilavuzlu -21296 +▁kilɛyanfa -21297 +▁kiswahili -21298 +▁kolosekaw -21299 +bir -21300 +bić -21301 +dɛn -21302 +fda -21303 +gbi -21304 +him -21305 +▁́i -21306 +jogo -21307 +loni -21308 +mgbi -21309 +sete -21310 +uran -21311 +wait -21312 +▁bɔɔ -21313 +▁kɔf -21314 +arabi -21315 +babić -21316 +ggara -21317 +himsa -21318 +terie -21319 +togow -21320 +ɛlɛna -21321 +▁bren -21322 +▁chat -21323 +▁dall -21324 +▁fɔnɔ -21325 +▁maas -21326 +▁parc -21327 +▁sibi -21328 +▁sona -21329 
+▁zabi -21330 +ibabić -21331 +mgbidi -21332 +ogokan -21333 +uranga -21334 +▁cadre -21335 +▁chari -21336 +▁chatg -21337 +▁garan -21338 +▁horse -21339 +▁kwasa -21340 +▁nimat -21341 +atontrī -21342 +čibabić -21343 +▁ahimsa -21344 +▁arcole -21345 +▁dawolo -21346 +▁ensete -21347 +▁hɛlɛna -21348 +▁jigira -21349 +▁kanari -21350 +▁kulusi -21351 +▁kuwait -21352 +▁kɛjogo -21353 +▁loloni -21354 +▁plugin -21355 +arabikan -21356 +encyclop -21357 +ogokanfɔ -21358 +▁ajaccio -21359 +▁brendan -21360 +▁charity -21361 +▁chatgpt -21362 +▁garanti -21363 +▁hamadɛn -21364 +▁maasina -21365 +▁plugins -21366 +▁poterie -21367 +atauranga -21368 +mučibabić -21369 +▁britishw -21370 +▁nimatɔrɔ -21371 +▁niɔgɔkan -21372 +▁regional -21373 +▁tenggara -21374 +▁komonwelf -21375 +▁konatéjoë -21376 +▁konkoroon -21377 +▁koryalike -21378 +▁koulikɔrɔ -21379 +▁kreciyenw -21380 +▁kulubalen -21381 +▁kulunboli -21382 +▁kumadɔnna -21383 +▁kumasurun -21384 +▁kuncɛyɔrɔ -21385 +▁kuntagala -21386 +▁kuntigiya -21387 +▁kurayaliw -21388 +▁kurdistan -21389 +▁kuunyinde -21390 +▁kwalitere -21391 +▁kèlècegni -21392 +▁kôlôsiliw -21393 +▁kùnnàfònì -21394 +▁kɔkurulen -21395 +▁kɔlɔsiliw -21396 +▁kɔnkɔnfin -21397 +▁kɔnɔkobaw -21398 +▁kɔrɔbɔliw -21399 +emi -21400 +fye -21401 +nos -21402 +pta -21403 +sos -21404 +éta -21405 +cela -21406 +engo -21407 +rane -21408 +▁duo -21409 +▁ita -21410 +▁oas -21411 +▁sec -21412 +diyɛn -21413 +emile -21414 +foral -21415 +hatha -21416 +lekan -21417 +raven -21418 +sonke -21419 +ttina -21420 +▁ando -21421 +▁duke -21422 +▁foye -21423 +▁gɔɔn -21424 +▁kɛta -21425 +▁minɔ -21426 +▁nfye -21427 +▁seta -21428 +foralt -21429 +nanama -21430 +noskan -21431 +porter -21432 +strane -21433 +établi -21434 +ɛninbɔ -21435 +▁auver -21436 +▁cipta -21437 +▁inisi -21438 +▁jenya -21439 +▁kanta -21440 +▁medic -21441 +▁nugug -21442 +▁secré -21443 +rantion -21444 +établit -21445 +▁andora -21446 +▁avatar -21447 +▁craven -21448 +▁ekipuw -21449 +▁faamun -21450 +▁faraka -21451 +▁future -21452 +▁gosini -21453 +▁imagen -21454 
+▁masiri -21455 +▁neotis -21456 +▁sanɔgɔ -21457 +▁wlekan -21458 +amanakan -21459 +romankan -21460 +▁bankass -21461 +▁bipolar -21462 +▁gnanama -21463 +▁inisiti -21464 +▁makomar -21465 +▁marengo -21466 +▁ɛndiyɛn -21467 +bamanakan -21468 +deductive -21469 +henrykjan -21470 +noskandia -21471 +▁auvergne -21472 +▁bɛɛninbɔ -21473 +▁comparti -21474 +▁drilling -21475 +▁farifina -21476 +▁khasonke -21477 +▁medicina -21478 +▁recursos -21479 +▁semitiki -21480 +▁taforalt -21481 +▁tannanan -21482 +▁tɔndenya -21483 +▁украинки -21484 +▁civettina -21485 +▁comporter -21486 +▁frameless -21487 +▁fransikaw -21488 +▁inisititu -21489 +▁kilometre -21490 +▁kɛlɛbilen -21491 +▁kɛlɛmansa -21492 +▁kɛlɛtigiw -21493 +▁kɛnkaliba -21494 +▁kɛnyɛrɛye -21495 +▁labɔlabaw -21496 +▁labɛncogo -21497 +▁ladamubaw -21498 +▁ladilibaw -21499 +lị -21500 +hus -21501 +jɛr -21502 +soa -21503 +why -21504 +▁io -21505 +▁tb -21506 +▁uô -21507 +bach -21508 +badi -21509 +lier -21510 +onio -21511 +sane -21512 +till -21513 +unil -21514 +ürkç -21515 +▁cré -21516 +▁cɛk -21517 +▁myx -21518 +▁ner -21519 +▁ɲɔn -21520 +abalị -21521 +dasoa -21522 +kohus -21523 +szawa -21524 +türkç -21525 +▁body -21526 +▁créa -21527 +▁elen -21528 +▁iugu -21529 +gulier -21530 +türkçe -21531 +▁agụrụ -21532 +▁bosna -21533 +▁dénou -21534 +▁dôsow -21535 +▁dɔnɛn -21536 +▁fujɛr -21537 +▁infor -21538 +▁iolan -21539 +▁iugum -21540 +▁jikan -21541 +▁kitaa -21542 +▁mines -21543 +▁rifle -21544 +▁still -21545 +▁warso -21546 +ɛnɛfura -21547 +▁balama -21548 +▁nerlan -21549 +▁općine -21550 +▁pisini -21551 +▁tamaan -21552 +▁wilila -21553 +▁ɲɛɲini -21554 +kerennen -21555 +warszawa -21556 +▁antonio -21557 +▁bidasoa -21558 +▁hassane -21559 +▁informe -21560 +▁iolanda -21561 +▁kitaabu -21562 +▁kobroor -21563 +▁niecine -21564 +▁nyerere -21565 +▁osaenia -21566 +▁tallinn -21567 +kɛminɛnni -21568 +washinton -21569 +▁archived -21570 +▁balamake -21571 +▁liczbach -21572 +▁lobugula -21573 +▁malabadi -21574 +▁nerlandi -21575 +▁plebejus -21576 +▁rifleman -21577 +▁régulier -21578 
+▁simpsons -21579 +▁yelemata -21580 +▁ɲɛfɔcogo -21581 +▁оказался -21582 +kerennenya -21583 +▁créations -21584 +▁fɛɛnɛfura -21585 +▁ladjɛléfɛ -21586 +▁ladɔgɔman -21587 +▁lafangama -21588 +▁lafantanw -21589 +▁lafiyalen -21590 +▁lakanabaa -21591 +▁lakoronen -21592 +▁lakunnikɛ -21593 +▁lakununna -21594 +▁lamununen -21595 +▁languages -21596 +▁lankoloon -21597 +▁lapasabaa -21598 +▁lapasabaw -21599 +!, -21600 +cde -21601 +gie -21602 +giz -21603 +▁hm -21604 +cɛgo -21605 +ills -21606 +nɔgɔ -21607 +yɔgɔ -21608 +èngè -21609 +▁awo -21610 +▁dak -21611 +▁dii -21612 +▁dir -21613 +▁dié -21614 +▁mec -21615 +▁suɛ -21616 +atles -21617 +engiz -21618 +hlaba -21619 +other -21620 +xarra -21621 +yilan -21622 +▁dine -21623 +▁diou -21624 +▁faka -21625 +▁fiin -21626 +▁igbo -21627 +▁laci -21628 +▁mige -21629 +▁nihi -21630 +▁ocde -21631 +▁seth -21632 +nɔgɔsi -21633 +▁diana -21634 +▁diɔrɔ -21635 +▁hills -21636 +▁jèngè -21637 +▁kanou -21638 +▁kantɛ -21639 +▁kongu -21640 +▁kromo -21641 +▁manis -21642 +▁mecca -21643 +▁migel -21644 +▁suɛzi -21645 +▁tlema -21646 +▁yanar -21647 +kɔrɔtan -21648 +landiya -21649 +yilandi -21650 +înement -21651 +чиленко -21652 +▁dakare -21653 +▁kɛcɛgo -21654 +▁lasiya -21655 +▁manɛti -21656 +▁masaba -21657 +▁mhlaba -21658 +▁nihilo -21659 +▁shubaa -21660 +nlandiya -21661 +▁beatles -21662 +▁camanba -21663 +▁dioulas -21664 +▁disemba -21665 +▁exclave -21666 +▁kanouté -21667 +▁nisɔngɔ -21668 +▁niɔgɔyɛ -21669 +▁warikun -21670 +▁énergie -21671 +raînement -21672 +thnologue -21673 +underbird -21674 +кочиленко -21675 +▁bagayɔgɔ -21676 +▁faamamar -21677 +▁gnèleman -21678 +▁lasiyaya -21679 +▁sethente -21680 +▁siniyobo -21681 +▁ɲasaland -21682 +jamahiriya -21683 +▁binganina -21684 +▁cakɛdabaw -21685 +▁dioulasso -21686 +▁diédougou -21687 +▁kromokari -21688 +▁lasagolen -21689 +▁latigɛkan -21690 +▁lawasalen -21691 +▁laɲininen -21692 +▁legislaci -21693 +▁leicester -21694 +▁lexington -21695 +▁libanaise -21696 +▁lomekwien -21697 +▁longitude -21698 +▁macrolepi -21699 +hni -21700 +nde -21701 
+nit -21702 +pni -21703 +rul -21704 +ledo -21705 +maha -21706 +nato -21707 +niin -21708 +urma -21709 +zhni -21710 +’’’, -21711 +▁jay -21712 +▁kat -21713 +▁mni -21714 +▁tas -21715 +▁tul -21716 +daɲɛw -21717 +hansa -21718 +ndekọ -21719 +shall -21720 +tikto -21721 +▁anko -21722 +▁baka -21723 +▁hare -21724 +▁libu -21725 +▁load -21726 +▁seie -21727 +▁stad -21728 +▁yeni -21729 +▁ʃaan -21730 +chepni -21731 +hɔrɔma -21732 +quisti -21733 +tiktok -21734 +▁bénit -21735 +▁canji -21736 +▁damad -21737 +▁joson -21738 +▁mauss -21739 +▁nataa -21740 +▁omaha -21741 +▁rudis -21742 +▁talen -21743 +▁tulsa -21744 +▁yeniş -21745 +bamɛtrɛ -21746 +climate -21747 +quistii -21748 +ropathi -21749 +▁ankole -21750 +▁cɛcila -21751 +▁damadᴐ -21752 +▁gourma -21753 +▁juguba -21754 +▁kalaan -21755 +▁koroko -21756 +▁lasili -21757 +▁nataaw -21758 +▁nizhni -21759 +▁sahrul -21760 +▁tannis -21761 +▁toledo -21762 +amahansa -21763 +erɔpukan -21764 +kumajago -21765 +lɔhɔrɔma -21766 +▁germani -21767 +▁josonaw -21768 +▁kasoden -21769 +▁kolonbɔ -21770 +▁olduvai -21771 +▁stadler -21772 +▁surundu -21773 +▁yenişar -21774 +▁yiribaw -21775 +adansonia -21776 +▁germanic -21777 +▁lɔhɔrɔma -21778 +▁marshall -21779 +espanyikan -21780 +▁farafinya -21781 +▁madgaskar -21782 +▁magotigiw -21783 +▁mahamadou -21784 +▁maliblues -21785 +▁malinoski -21786 +▁manantali -21787 +▁mandonnen -21788 +▁manipuler -21789 +▁maniɲanba -21790 +▁marakakan -21791 +▁marakelaw -21792 +▁mariupoli -21793 +▁marsikalo -21794 +▁masirilen -21795 +▁maximiser -21796 +▁mekanikiw -21797 +▁meksikano -21798 +▁meleagris -21799 +bdb -21800 +▁pụ -21801 +▁ɳɛ -21802 +bdbv -21803 +deon -21804 +gusa -21805 +ilin -21806 +▁dwa -21807 +▁era -21808 +▁kei -21809 +▁odé -21810 +▁ɳas -21811 +beria -21812 +duata -21813 +etara -21814 +kanso -21815 +kille -21816 +lasse -21817 +yaman -21818 +▁basa -21819 +▁djeï -21820 +▁dɔla -21821 +▁fans -21822 +▁jɛmu -21823 +▁kwen -21824 +▁pala -21825 +▁vega -21826 +aikata -21827 +christ -21828 +classe -21829 +dantes -21830 +datugu -21831 
+killed -21832 +kurufa -21833 +schild -21834 +▁anima -21835 +▁beaux -21836 +▁danbé -21837 +▁dwaya -21838 +▁décla -21839 +▁furum -21840 +▁jansa -21841 +▁jerin -21842 +▁joliw -21843 +▁keith -21844 +▁nasau -21845 +▁nauti -21846 +▁sandi -21847 +▁vegas -21848 +kunwɔrɔ -21849 +▁djeïté -21850 +▁erasia -21851 +▁frejus -21852 +▁guilin -21853 +▁gèrègè -21854 +▁kɔnɔta -21855 +▁pụtara -21856 +▁ragusa -21857 +▁suguba -21858 +▁sɔrɔta -21859 +▁ɳashin -21860 +aliberia -21861 +thschild -21862 +▁animaux -21863 +▁chetara -21864 +▁jɛmukan -21865 +▁maharaj -21866 +▁mansaso -21867 +▁palatal -21868 +▁siyaman -21869 +▁viduata -21870 +▁рисунок -21871 +datugunen -21872 +pendantes -21873 +▁conduite -21874 +▁fulasolo -21875 +▁jirikari -21876 +▁kwenyere -21877 +▁nautilus -21878 +▁poussant -21879 +▁sankanso -21880 +▁shqipëri -21881 +adịkarịghị -21882 +tinkunwɔrɔ -21883 +▁bamakôkaw -21884 +▁barcelona -21885 +▁kɛlɛkeden -21886 +▁mellivora -21887 +▁mexicanos -21888 +▁mezzanone -21889 +▁mgbagwoju -21890 +▁microsoft -21891 +▁migration -21892 +▁mikrosɔft -21893 +▁militaire -21894 +▁milliards -21895 +▁milliɔnki -21896 +▁milwaukee -21897 +▁minakalan -21898 +▁miniaturi -21899 +pf -21900 +epf -21901 +nab -21902 +naî -21903 +oji -21904 +pma -21905 +sab -21906 +čna -21907 +▁[[ -21908 +brie -21909 +epfl -21910 +naba -21911 +naît -21912 +sabt -21913 +ynab -21914 +▁dil -21915 +▁wil -21916 +anima -21917 +ation -21918 +enium -21919 +ojida -21920 +ption -21921 +xerus -21922 +yentɔ -21923 +úcuta -21924 +▁bats -21925 +▁bira -21926 +▁cèba -21927 +▁daou -21928 +▁depi -21929 +anična -21930 +chilen -21931 +mation -21932 +nabawi -21933 +nanima -21934 +quelin -21935 +▁dunni -21936 +▁kènèw -21937 +▁malga -21938 +▁silan -21939 +▁siyen -21940 +brielle -21941 +doption -21942 +gandugu -21943 +rmation -21944 +vanična -21945 +▁cúcuta -21946 +▁depite -21947 +▁dilana -21948 +▁dɔnrɔn -21949 +▁jiboli -21950 +▁kanuko -21951 +▁kɛrɛcɛ -21952 +▁lamine -21953 +▁moheni -21954 +▁sounfo -21955 +▁teoriw -21956 +▁wilson -21957 +▁zaynab 
-21958 +▁égypte -21959 +beyanfan -21960 +chilenko -21961 +ineation -21962 +▁changer -21963 +▁connaît -21964 +▁euxerus -21965 +▁fiyentɔ -21966 +▁khalife -21967 +▁koojida -21968 +▁lôgôkun -21969 +▁relatif -21970 +▁sièkili -21971 +firmation -21972 +kpakpando -21973 +▁adoption -21974 +▁batswana -21975 +▁cristata -21976 +▁finɲanma -21977 +▁forkjeli -21978 +▁malgache -21979 +▁poquelin -21980 +▁sounfoun -21981 +▁zvanična -21982 +nanimafenw -21983 +▁bolifɛnko -21984 +▁diagayété -21985 +▁digandugu -21986 +▁djamanade -21987 +▁gabrielle -21988 +▁kelenpeya -21989 +▁minisisow -21990 +▁ministère -21991 +▁minorités -21992 +▁misikolon -21993 +▁misimusow -21994 +▁misirakaw -21995 +▁mmeghachi -21996 +▁mmekorita -21997 +▁mmekọrịta -21998 +▁mormyrops -21999 +%) -22000 +iko -22001 +ᴐna -22002 +▁(“ -22003 +▁ks -22004 +▁|} -22005 +asụs -22006 +enda -22007 +goga -22008 +luwa -22009 +thug -22010 +xles -22011 +▁bɔg -22012 +▁ilm -22013 +▁kov -22014 +▁lol -22015 +albam -22016 +asụsụ -22017 +cinin -22018 +ikotɛ -22019 +jeune -22020 +▁bèyi -22021 +▁kaga -22022 +▁kola -22023 +▁kunc -22024 +▁nᴐna -22025 +▁tite -22026 +▁ɲeni -22027 +albamu -22028 +endale -22029 +phiebɛ -22030 +sorofe -22031 +▁axles -22032 +▁donda -22033 +▁dumia -22034 +▁ibero -22035 +▁isiya -22036 +▁kovro -22037 +▁ouane -22038 +▁phoci -22039 +▁tanaj -22040 +▁vietn -22041 +▁ɲeniɲ -22042 +galikaw -22043 +▁bajida -22044 +▁bɔgɔrɔ -22045 +▁degoga -22046 +▁ilmeni -22047 +▁jadila -22048 +▁kaluwa -22049 +▁kovrov -22050 +▁kwenye -22051 +▁kôkuru -22052 +▁lignon -22053 +▁ncinin -22054 +▁saniôn -22055 +▁sonzan -22056 +▁wagadu -22057 +thcrodon -22058 +▁isiyaka -22059 +▁jiikotɛ -22060 +▁masabon -22061 +▁motikaw -22062 +▁phocian -22063 +▁premios -22064 +▁ilmenite -22065 +▁mansasiw -22066 +▁nᴐnabila -22067 +▁ɲeniɲeni -22068 +sorofekɔnɔ -22069 +▁bonendale -22070 +▁bɔgɔrɔdɔn -22071 +▁fangaɲɛma -22072 +▁including -22073 +▁masabonda -22074 +▁mouhammad -22075 +▁multimédi -22076 +▁multitude -22077 +▁municipal -22078 +▁murutilen -22079 +▁musambiki 
-22080 +▁musophaga -22081 +▁métropole -22082 +▁môdenmuso -22083 +▁mɔnikɛlaw -22084 +▁naissance -22085 +▁namaratôw -22086 +▁nankɔrɔla -22087 +▁nbogotigi -22088 +▁nescience -22089 +▁ngosipụta -22090 +▁ngusujeli -22091 +▁niangadou -22092 +▁nicaragua -22093 +▁niɛbɔyɔrɔ -22094 +▁niɛnɛbɔlɛ -22095 +▁nkankoron -22096 +▁nkekọrịta -22097 +▁nkɛlɛnnin -22098 +▁nsoroŋɛɲɛ -22099 +log -22100 +pir -22101 +psi -22102 +roş -22103 +▁(, -22104 +▁(= -22105 +▁(ˈ -22106 +▁gó -22107 +▁tî -22108 +blog -22109 +lerk -22110 +loka -22111 +occa -22112 +phor -22113 +uron -22114 +wura -22115 +▁gap -22116 +▁sav -22117 +araná -22118 +bbing -22119 +ciens -22120 +diako -22121 +ebola -22122 +inedo -22123 +lipsi -22124 +lokal -22125 +pirar -22126 +sente -22127 +tteur -22128 +▁davo -22129 +▁góme -22130 +▁harm -22131 +▁kans -22132 +▁kole -22133 +▁salu -22134 +▁sant -22135 +▁sino -22136 +ciosus -22137 +contra -22138 +phorus -22139 +umanen -22140 +▁cogow -22141 +▁davos -22142 +▁filiw -22143 +▁gómez -22144 +▁khald -22145 +▁klerk -22146 +▁kolek -22147 +▁nɔgɔw -22148 +▁saber -22149 +▁salut -22150 +▁socié -22151 +camelus -22152 +diakoin -22153 +loading -22154 +résente -22155 +uronaux -22156 +vipirar -22157 +▁ballad -22158 +▁filiba -22159 +▁katiri -22160 +▁kinedo -22161 +▁kolekc -22162 +▁nigiri -22163 +▁niɔgɔf -22164 +▁paraná -22165 +▁savana -22166 +▁sawura -22167 +africine -22168 +contrada -22169 +daɲɛgafe -22170 +occasion -22171 +▁barbera -22172 +▁dubbing -22173 +▁ellipsi -22174 +▁falenna -22175 +▁harmoni -22176 +▁kansɛri -22177 +▁khaldun -22178 +▁kolekcj -22179 +▁metteur -22180 +▁société -22181 +jovaciens -22182 +▁bamɛtɛrɛ -22183 +▁nafabɔli -22184 +▁niɔgɔfar -22185 +▁tigɛtigɛ -22186 +developing -22187 +▁favipirar -22188 +▁harmonika -22189 +▁kerecenya -22190 +▁kosumanen -22191 +▁kurukuruw -22192 +▁majiginni -22193 +▁nationale -22194 +▁neuronaux -22195 +▁ntamannin -22196 +▁ntenbilen -22197 +▁nyamanton -22198 +▁nòwanburu -22199 +slo -22200 +cost -22201 +fɔrɔ -22202 +gapo -22203 +nium -22204 +vary -22205 +zuha 
-22206 +ɔrɔw -22207 +▁fao -22208 +▁lau -22209 +▁pɔn -22210 +▁six -22211 +anaan -22212 +bokin -22213 +jalla -22214 +jikaw -22215 +suala -22216 +unisa -22217 +▁badu -22218 +▁fami -22219 +▁gala -22220 +▁mɔti -22221 +▁oslo -22222 +▁sian -22223 +▁sosi -22224 +actuel -22225 +gapore -22226 +sensta -22227 +ssinka -22228 +▁baraa -22229 +▁bɔrɔw -22230 +▁crini -22231 +▁kaboi -22232 +▁pɔnpe -22233 +arlotte -22234 +lennium -22235 +stiques -22236 +▁abokin -22237 +▁ankara -22238 +▁bamajɛ -22239 +▁bamakɛ -22240 +▁bovary -22241 +▁djalla -22242 +▁dogoya -22243 +▁famili -22244 +▁indika -22245 +▁kazuha -22246 +▁laurie -22247 +▁motion -22248 +▁sɛfɔlɔ -22249 +fɔrɔkili -22250 +kɛbaliya -22251 +senstadt -22252 +▁ambelau -22253 +▁kaboila -22254 +▁kôrôbaw -22255 +▁kɔrɔnfe -22256 +▁ntanaan -22257 +▁sianfan -22258 +▁sosiali -22259 +charlotte -22260 +deminsenw -22261 +illennium -22262 +kisandiri -22263 +▁commence -22264 +▁crinifer -22265 +▁familiar -22266 +▁nafoloba -22267 +▁samagara -22268 +▁sosialis -22269 +millennium -22270 +▁badufalen -22271 +▁fonología -22272 +▁hordaceus -22273 +▁labaarata -22274 +▁lamunulen -22275 +▁margarita -22276 +▁nɔgɔlenya -22277 +▁nɔnsiwulu -22278 +▁okestream -22279 +▁oldowayen -22280 +▁ouologuem -22281 +▁pachelbel -22282 +▁pallascio -22283 +▁paninekaw -22284 +▁panpulimu -22285 +▁paradoxum -22286 +▁parlement -22287 +▁pelengana -22288 +▁pentecoti -22289 +▁personnes -22290 +▁phoenicul -22291 +▁photoshop -22292 +▁physiques -22293 +▁plastique -22294 +▁plexiglas -22295 +▁plongeons -22296 +▁plusieurs -22297 +▁población -22298 +▁politikow -22299 +|( -22300 +ых -22301 +دي -22302 +سَ -22303 +)]. 
-22304 +afɔ -22305 +mɛo -22306 +pax -22307 +ديم -22308 +▁., -22309 +▁fâ -22310 +▁vh -22311 +koya -22312 +ديمق -22313 +▁adi -22314 +▁pam -22315 +▁pse -22316 +▁тру -22317 +kolen -22318 +tuhan -22319 +ديمقر -22320 +▁alig -22321 +▁badi -22322 +▁bula -22323 +▁fâri -22324 +▁hidi -22325 +▁kaka -22326 +▁kreo -22327 +▁laja -22328 +▁nika -22329 +▁omɛo -22330 +▁pseu -22331 +▁yogī -22332 +▁труд -22333 +ديمقرا -22334 +▁anetz -22335 +▁bocca -22336 +▁chili -22337 +▁eblan -22338 +▁gomme -22339 +▁login -22340 +▁manon -22341 +▁minka -22342 +▁mmeri -22343 +▁rapax -22344 +▁труды -22345 +sibagaw -22346 +▁alighi -22347 +▁badius -22348 +▁dourou -22349 +▁draman -22350 +▁fresna -22351 +▁hector -22352 +▁hidima -22353 +▁kabine -22354 +▁kreole -22355 +▁kɛrɛbɛ -22356 +▁lajaba -22357 +▁lakunu -22358 +▁mamady -22359 +▁ntolan -22360 +▁pamata -22361 +▁pseudo -22362 +sentuhan -22363 +▁dramann -22364 +▁filemon -22365 +▁flenklo -22366 +▁fresnay -22367 +▁inidiya -22368 +▁kɛlɛlɛw -22369 +▁misinin -22370 +▁pamatao -22371 +egwuregwu -22372 +kɔnɔntɔnw -22373 +upanishad -22374 +▁hepsetus -22375 +▁korobara -22376 +▁kɛrɛbɛtɛ -22377 +▁nkarifin -22378 +▁omɛopati -22379 +▁yɔrɔkoya -22380 +▁الديمقرا -22381 +lectricité -22382 +▁alighieri -22383 +▁boccaccio -22384 +▁djumarala -22385 +▁flenkloci -22386 +▁portables -22387 +▁pradīpikā -22388 +▁preduzeće -22389 +▁pressions -22390 +▁processus -22391 +▁programuw -22392 +▁progresso -22393 +▁protestan -22394 +▁prototype -22395 +▁prédisait -22396 +▁purchases -22397 +▁pɔliyɔfin -22398 +▁pɛrɛsikan -22399 +,, -22400 +:# -22401 +yj -22402 +}[ -22403 +▁ì -22404 +▁š -22405 +fyj -22406 +ism -22407 +oke -22408 +pup -22409 +ɔnɛ -22410 +▁yô -22411 +▁ìh -22412 +,,'. 
-22413 +aren -22414 +ason -22415 +ceph -22416 +diin -22417 +eniw -22418 +kiro -22419 +voni -22420 +zugu -22421 +▁dit -22422 +▁opo -22423 +▁sao -22424 +▁ìhè -22425 +anism -22426 +chena -22427 +coral -22428 +dukaw -22429 +pupli -22430 +rkiro -22431 +▁fɔnɛ -22432 +▁lise -22433 +▁siye -22434 +▁wfyj -22435 +barali -22436 +forbes -22437 +mizugu -22438 +vonica -22439 +wideyo -22440 +yadiin -22441 +▁bundi -22442 +▁ikomi -22443 +▁medin -22444 +▁ncɔgɔ -22445 +▁opoku -22446 +▁sieki -22447 +▁sthan -22448 +▁sèche -22449 +▁tunga -22450 +▁zapan -22451 +asoning -22452 +chanism -22453 +dumaren -22454 +issants -22455 +missiri -22456 +puplica -22457 +shchena -22458 +strauss -22459 +▁bambou -22460 +▁change -22461 +▁niduru -22462 +▁polisi -22463 +▁sangan -22464 +▁siyera -22465 +▁yalaba -22466 +▁ɲegetu -22467 +maninkaw -22468 +mizugumi -22469 +▁abidjan -22470 +▁bambouk -22471 +▁batosow -22472 +▁bundibu -22473 +▁dunniya -22474 +▁indukaw -22475 +▁kirkiro -22476 +▁mansakɛ -22477 +▁ncɔgɔɔn -22478 +▁scholia -22479 +▁solaire -22480 +▁šiprage -22481 +▁abdulayi -22482 +▁bundibug -22483 +▁dɛsɛlenw -22484 +▁fɔnɛtigi -22485 +▁juventud -22486 +▁kunbeniw -22487 +▁labarali -22488 +▁pavonica -22489 +▁directory -22490 +▁mechanism -22491 +▁moshchena -22492 +▁puissants -22493 +▁reasoning -22494 +▁redéfinir -22495 +▁relations -22496 +▁religieux -22497 +▁religiøse -22498 +▁remarques -22499 +/? 
-22500 +?: -22501 +▁』 -22502 +nke -22503 +ozi -22504 +▁ߒߠ -22505 +coko -22506 +hyte -22507 +unen -22508 +▁abé -22509 +▁box -22510 +▁die -22511 +▁haa -22512 +▁ߒߠߋ -22513 +decin -22514 +ghara -22515 +hytei -22516 +ision -22517 +istic -22518 +kolma -22519 +ppine -22520 +▁kɔɔr -22521 +▁lura -22522 +▁real -22523 +▁tera -22524 +cision -22525 +misozi -22526 +sheets -22527 +▁fanka -22528 +▁janba -22529 +▁jogin -22530 +▁kofan -22531 +▁musta -22532 +▁nsɛrɛ -22533 +▁tloon -22534 +iltlebi -22535 +imisozi -22536 +paghara -22537 +▁bronis -22538 +▁bàgàni -22539 +▁dienta -22540 +▁kɔɔrin -22541 +▁museet -22542 +▁njikwa -22543 +▁orange -22544 +▁whytei -22545 +adomości -22546 +finitive -22547 +▁kanulen -22548 +▁kanunen -22549 +▁mustafa -22550 +▁médecin -22551 +▁shankar -22552 +▁silamaw -22553 +▁terason -22554 +▁zimbabu -22555 +▁arabique -22556 +▁balikuya -22557 +▁baszucki -22558 +▁différen -22559 +▁mpaghara -22560 +▁niangolo -22561 +▁nkalonma -22562 +▁petridis -22563 +▁zimbabue -22564 +▁bronislaw -22565 +▁degharịrị -22566 +▁farikolma -22567 +▁joginlenw -22568 +▁kalancoko -22569 +▁kelenyako -22570 +▁précision -22571 +▁renouveau -22572 +▁repuplica -22573 +▁rifugiati -22574 +▁rodríguez -22575 +▁romanikan -22576 +▁rostratus -22577 +▁rufescens -22578 +▁sakamakon -22579 +▁sakoumana -22580 +▁salamanto -22581 +▁samnyâsin -22582 +▁sanfɛyɔrɔ -22583 +▁saniyalan -22584 +▁sannakolo -22585 +▁sarasvati -22586 +▁satirical -22587 +▁sayijirin -22588 +▁scoresese -22589 +▁sebastián -22590 +▁seginkɛra -22591 +▁selective -22592 +▁selilɛriw -22593 +▁sensation -22594 +▁serekunda -22595 +▁seribanin -22596 +▁shinsegae -22597 +▁sibiridon -22598 +▁sikiralan -22599 +.( -22600 +fn -22601 +sı -22602 +vɔ -22603 +amd -22604 +edo -22605 +pec -22606 +wir -22607 +endu -22608 +mapp -22609 +opec -22610 +swir -22611 +sɛna -22612 +tumu -22613 +vɔla -22614 +▁bli -22615 +▁jɔw -22616 +▁kfɛ -22617 +▁lfn -22618 +▁lɔn -22619 +▁mbi -22620 +edobe -22621 +rouen -22622 +zmapp -22623 +▁glam -22624 +▁goun -22625 +▁kafa -22626 +▁kasa 
-22627 +▁kwat -22628 +▁laga -22629 +▁maba -22630 +▁opus -22631 +▁yésu -22632 +raneus -22633 +▁belle -22634 +▁chini -22635 +▁ciyar -22636 +▁daegu -22637 +▁kosèn -22638 +▁magwa -22639 +▁mange -22640 +▁maïga -22641 +▁meera -22642 +▁minin -22643 +▁złota -22644 +ejedebe -22645 +garangi -22646 +▁gounas -22647 +▁kafada -22648 +▁kasabi -22649 +▁kumaba -22650 +▁lagafo -22651 +▁lawalé -22652 +▁milvus -22653 +▁nimaya -22654 +▁yamato -22655 +buyekalo -22656 +cameroun -22657 +swirling -22658 +▁bankası -22659 +▁bikanni -22660 +▁faceira -22661 +▁glamour -22662 +▁gounass -22663 +▁jɛnsɛna -22664 +▁kazakst -22665 +▁kosènbè -22666 +▁kumakan -22667 +▁lɔnduru -22668 +▁magwaan -22669 +▁mbipụta -22670 +▁miliyan -22671 +▁raconta -22672 +▁tangala -22673 +▁tounani -22674 +▁موريتان -22675 +legorguei -22676 +▁bantukan -22677 +▁burutumu -22678 +▁laticeps -22679 +▁manamana -22680 +▁ouenzzin -22681 +dɔgɔtɔrɔya -22682 +▁afrikaden -22683 +▁ingarangi -22684 +▁kazakstan -22685 +▁sikorolen -22686 +▁sinankuun -22687 +▁sinsinibɛ -22688 +▁sinsinnan -22689 +▁sirenaika -22690 +▁skiptrace -22691 +▁soberania -22692 +▁sociologi -22693 +▁soggiorno -22694 +▁sojobaara -22695 +▁solokujan -22696 +▁sorodachi -22697 +▁sosiyetew -22698 +▁streaming -22699 +ln -22700 +gew -22701 +mln -22702 +uda -22703 +▁sü -22704 +anta -22705 +onés -22706 +sura -22707 +undp -22708 +ɛrsa -22709 +▁cfa -22710 +▁jor -22711 +▁lum -22712 +▁nav -22713 +▁ppp -22714 +▁sɔw -22715 +▁ߘߐ߫ -22716 +▁ߣߌ߫ -22717 +bowda -22718 +cauda -22719 +lenti -22720 +▁dite -22721 +▁east -22722 +▁enco -22723 +▁fast -22724 +▁waan -22725 +▁yara -22726 +chiani -22727 +etstop -22728 +élande -22729 +▁asura -22730 +▁balle -22731 +▁bangu -22732 +▁egido -22733 +▁jorji -22734 +▁manda -22735 +▁nongo -22736 +▁renmu -22737 +▁sauve -22738 +▁tigew -22739 +▁waanɛ -22740 +▁watiw -22741 +▁weere -22742 +kukalan -22743 +llionés -22744 +zélande -22745 +ɛripunk -22746 +▁balaan -22747 +▁ballet -22748 +▁buguri -22749 +▁debala -22750 +▁dɔntaw -22751 +▁emilia -22752 +▁encore -22753 
+▁fakoli -22754 +▁fariye -22755 +▁jarida -22756 +▁jorjia -22757 +▁lumine -22758 +▁nyokon -22759 +▁shirin -22760 +▁ߝߊ߫ߙߊ߬ -22761 +bɛripunk -22762 +▁kalanma -22763 +▁kouanta -22764 +▁kumalaw -22765 +▁madɛrsa -22766 +▁militon -22767 +▁navarra -22768 +▁sauveur -22769 +▁talking -22770 +▁tchiani -22771 +naissance -22772 +seregbede -22773 +terambere -22774 +▁bangudɔn -22775 +▁lumineux -22776 +▁románico -22777 +▁tounkara -22778 +populasion -22779 +▁albicauda -22780 +▁dilanfɛnw -22781 +▁gramática -22782 +▁jirikunan -22783 +▁masabowda -22784 +▁studiorum -22785 +▁subjectif -22786 +▁sumankoyi -22787 +▁sunbalani -22788 +▁sunguruun -22789 +▁surakakan -22790 +▁surunyala -22791 +▁surunyali -22792 +▁sweetstop -22793 +▁sɔmikɛlen -22794 +▁sɔrɔcogow -22795 +▁sɔrɔkodon -22796 +▁sɛgɛbanpo -22797 +▁sɛrɛkiliw -22798 +▁sɛtanburu -22799 +*] -22800 +fv -22801 +gm -22802 +mf -22803 +’, -22804 +[*] -22805 +gér -22806 +may -22807 +zow -22808 +ɔga -22809 +аши -22810 +ụma -22811 +goda -22812 +gunw -22813 +hemi -22814 +kilɛ -22815 +laho -22816 +lour -22817 +sona -22818 +sɛrɛ -22819 +tafv -22820 +tune -22821 +urfi -22822 +▁amô -22823 +▁dya -22824 +▁imf -22825 +▁jiè -22826 +▁mug -22827 +▁njz -22828 +[*]). 
-22829 +deola -22830 +dɔnke -22831 +mayer -22832 +quard -22833 +sinus -22834 +▁woso -22835 +▁zoro -22836 +▁маши -22837 +aniɔga -22838 +gérard -22839 +lahoma -22840 +▁amôna -22841 +▁amụma -22842 +▁andes -22843 +▁bozow -22844 +▁diata -22845 +▁djiré -22846 +▁heart -22847 +▁kɔɔnɔ -22848 +▁maris -22849 +▁minor -22850 +▁moriw -22851 +▁muggu -22852 +▁pegun -22853 +▁siyar -22854 +▁tgoda -22855 +▁zurfi -22856 +lourdio -22857 +▁asinus -22858 +▁diinɛw -22859 +▁dorcas -22860 +▁katɛmɛ -22861 +▁manque -22862 +▁nehemi -22863 +▁sogolo -22864 +▁yɛrɛbɔ -22865 +entielle -22866 +kɔrɔbɔli -22867 +lourdios -22868 +publiken -22869 +sɛrɛkili -22870 +▁ardeola -22871 +▁jaridun -22872 +▁jatigiw -22873 +▁kalanen -22874 +▁rapides -22875 +leichtman -22876 +principes -22877 +▁baptiste -22878 +▁jacquard -22879 +▁jikoroni -22880 +▁oklahoma -22881 +▁revision -22882 +kɛtiokoyaw -22883 +quentielle -22884 +▁cɛfarinya -22885 +▁jerusalem -22886 +▁ogasawara -22887 +▁taamasiɲɛ -22888 +▁tafunteni -22889 +▁takokelen -22890 +▁tamasheck -22891 +▁tamasiyew -22892 +▁taniworon -22893 +▁tankanika -22894 +▁tanninani -22895 +▁taqbaylit -22896 +▁tayilandi -22897 +▁terrasson -22898 +▁tessougué -22899 +arụ -22900 +rex -22901 +uvi -22902 +▁wy -22903 +malo -22904 +peru -22905 +ryth -22906 +soba -22907 +sofi -22908 +tama -22909 +▁daɳ -22910 +▁etn -22911 +▁aman -22912 +▁behl -22913 +▁daɳɛ -22914 +▁juba -22915 +▁kiss -22916 +▁mask -22917 +▁nogo -22918 +▁papa -22919 +▁wabi -22920 +alauvi -22921 +igname -22922 +koloci -22923 +lorifi -22924 +rythré -22925 +rụpụta -22926 +▁behlü -22927 +▁bight -22928 +▁brain -22929 +▁denkè -22930 +▁déter -22931 +▁kunne -22932 +▁noken -22933 +▁sorex -22934 +rythrée -22935 +tilebin -22936 +▁behlül -22937 +▁bogoti -22938 +▁cheick -22939 +▁daniɛl -22940 +▁donsow -22941 +▁dôsoba -22942 +▁forbes -22943 +▁koloon -22944 +▁kuruun -22945 +▁kɔnɔfɛ -22946 +▁tarihi -22947 +▁togoda -22948 +ficience -22949 +tamasheq -22950 +▁benkadi -22951 +▁fromazi -22952 +▁gbanwee -22953 +▁kɔnɔnin -22954 +▁kɛɲɛlen -22955 
+▁nrụpụta -22956 +▁tileman -22957 +▁tlacogo -22958 +islāmiyya -22959 +lorifique -22960 +▁badabolo -22961 +▁cristina -22962 +▁détermin -22963 +▁filɛsofi -22964 +▁kungodaw -22965 +▁nogosira -22966 +▁pauvreté -22967 +▁reservew -22968 +▁sualauvi -22969 +▁sɛbɛnnin -22970 +▁trinidad -22971 +▁wabiwɔrɔ -22972 +▁érythrée -22973 +déficience -22974 +ffairsjour -22975 +▁alopochen -22976 +▁dagayɔrɔw -22977 +▁etnologie -22978 +▁tetraodon -22979 +▁tidjaniya -22980 +▁tigilamaw -22981 +▁tijaniyaw -22982 +▁tijaniyya -22983 +▁tilayɔrɔw -22984 +▁tirumalai -22985 +▁tiɲɛbaliw -22986 +▁tlashegin -22987 +▁tlomageni -22988 +▁tortonian -22989 +▁touristes -22990 +▁toussaint -22991 +▁townships -22992 +▁transport -22993 +▁trigonoce -22994 +▁tshivenda -22995 +▁tsokosogo -22996 +▁tulobilew -22997 +▁tulubilen -22998 +▁tulubilew -22999 +mọ -23000 +nr -23001 +xo -23002 +ип -23003 +יו -23004 +ظا -23005 +▁} -23006 +arm -23007 +cit -23008 +uye -23009 +шип -23010 +ظام -23011 +▁") -23012 +gies -23013 +kwar -23014 +mago -23015 +mọkụ -23016 +vert -23017 +wada -23018 +yaan -23019 +yaxo -23020 +نظام -23021 +▁bow -23022 +▁eke -23023 +▁kum -23024 +▁yil -23025 +bules -23026 +dekan -23027 +kundi -23028 +récit -23029 +ɛmɔgɔ -23030 +шипра -23031 +▁angl -23032 +▁bagh -23033 +▁buta -23034 +▁dabo -23035 +▁hadj -23036 +▁yilè -23037 +▁نظام -23038 +panish -23039 +pomọkụ -23040 +refini -23041 +yeyaxo -23042 +шипраг -23043 +▁bayad -23044 +▁buaré -23045 +▁daara -23046 +▁ekele -23047 +▁folon -23048 +▁franz -23049 +▁geren -23050 +▁kauye -23051 +▁madhy -23052 +▁samun -23053 +▁ʃyaan -23054 +▁людей -23055 +firearm -23056 +ivresse -23057 +шипраге -23058 +▁babada -23059 +▁babara -23060 +▁bogies -23061 +▁butast -23062 +▁gordon -23063 +▁tuskan -23064 +kɔnɔwari -23065 +libiyyah -23066 +lohoroma -23067 +▁baghdad -23068 +▁fabules -23069 +▁facería -23070 +▁miɛmɔgɔ -23071 +▁soginen -23072 +▁spanish -23073 +▁syngman -23074 +▁tyeyaxo -23075 +kwararrun -23076 +▁bagabaga -23077 +▁balanzan -23078 +▁butastur -23079 +▁denkundi -23080 
+▁eapensis -23081 +▁julidɛsɛ -23082 +▁kɔrɔtali -23083 +▁madhyama -23084 +▁minɛyɔrɔ -23085 +▁okpomọkụ -23086 +▁chambered -23087 +▁karabinta -23088 +▁labanyɔrɔ -23089 +▁soumounou -23090 +▁tubabulaw -23091 +▁turdoides -23092 +▁turquoise -23093 +▁twatwalen -23094 +▁tɔgɔlakaw -23095 +▁tɔnɔbɔtan -23096 +▁ultrabeat -23097 +▁unctuosus -23098 +▁underwood -23099 +?] -23100 +sā -23101 +śa -23102 +ил -23103 +ߊߟ -23104 +idu -23105 +mpɛ -23106 +tiw -23107 +ƙat -23108 +ߊߟߎ -23109 +▁fn -23110 +▁kd -23111 +arte -23112 +clip -23113 +cnrs -23114 +romɛ -23115 +tiin -23116 +овил -23117 +ߊߟߎ߫ -23118 +dobsk -23119 +lotii -23120 +onkan -23121 +rever -23122 +sitiw -23123 +thani -23124 +ƙatun -23125 +▁akan -23126 +▁dond -23127 +▁hiti -23128 +▁kdwe -23129 +▁kise -23130 +▁nich -23131 +▁nkus -23132 +▁team -23133 +▁ọkpa -23134 +kinolo -23135 +ановил -23136 +▁albus -23137 +▁denis -23138 +▁dondô -23139 +▁hanni -23140 +▁koidu -23141 +▁merit -23142 +▁panja -23143 +▁pompɛ -23144 +▁takeo -23145 +alitéso -23146 +ejigide -23147 +ladonna -23148 +romɛkaw -23149 +thaniel -23150 +▁autant -23151 +▁baboon -23152 +▁dowèrè -23153 +▁fluidi -23154 +▁gosita -23155 +▁nkusun -23156 +▁panjab -23157 +▁samiye -23158 +▁sigiba -23159 +▁sirala -23160 +▁sɔrɔka -23161 +▁yɔrɔbɔ -23162 +kinolozi -23163 +становил -23164 +▁buƙatun -23165 +▁dembele -23166 +▁forever -23167 +▁hitikan -23168 +▁lionkan -23169 +▁nichbis -23170 +▁podobsk -23171 +▁presses -23172 +▁shubaga -23173 +▁brachyce -23174 +▁chinekaw -23175 +▁fluidité -23176 +▁takeover -23177 +italiyanci -23178 +umandougou -23179 +▁kuntilena -23180 +▁kɛlɛkɛdew -23181 +▁nathaniel -23182 +▁pyramides -23183 +▁réalitéso -23184 +▁vancouver -23185 +▁vieilloti -23186 +▁volumique -23187 +▁voyageurs -23188 +▁vélingara -23189 +▁vɛdantiki -23190 +▁wahlbergi -23191 +▁wikiquote -23192 +▁wolofukan -23193 +▁wolonfila -23194 +▁wolonkoto -23195 +▁worcester -23196 +▁wulukucɛn -23197 +▁wulunintu -23198 +▁wystawien -23199 +kk -23200 +kũ -23201 +sô -23202 +zs -23203 +ɗe -23204 +ות -23205 +kũy 
-23206 +lzs -23207 +ɲɔn -23208 +רות -23209 +bles -23210 +buli -23211 +fliw -23212 +insi -23213 +kera -23214 +kũyũ -23215 +laya -23216 +lefi -23217 +viad -23218 +▁ago -23219 +▁huy -23220 +▁inj -23221 +ertec -23222 +lllzs -23223 +nouve -23224 +simón -23225 +łobez -23226 +▁asan -23227 +▁buɗe -23228 +▁bènn -23229 +▁degu -23230 +▁dɔbɔ -23231 +▁erik -23232 +▁mɔkɔ -23233 +▁sôsô -23234 +▁tayi -23235 +bulika -23236 +niwolo -23237 +nouvel -23238 +ɲɔngɔn -23239 +▁ainsi -23240 +▁donli -23241 +▁fokan -23242 +▁kaadị -23243 +▁kasin -23244 +▁sango -23245 +▁tante -23246 +▁tiogo -23247 +▁zviad -23248 +tikibaw -23249 +▁asante -23250 +▁asmara -23251 +▁biggan -23252 +▁deguun -23253 +▁furuli -23254 +▁hɛrɛba -23255 +▁kewari -23256 +▁madame -23257 +▁molefi -23258 +▁musoya -23259 +▁ocelli -23260 +▁sarama -23261 +▁subsis -23262 +▁traiti -23263 +bɛliziki -23264 +jjklllzs -23265 +pubulika -23266 +▁artiste -23267 +▁benkera -23268 +▁falatow -23269 +▁injinia -23270 +▁logical -23271 +▁romance -23272 +budadiinɛ -23273 +niwolofla -23274 +▁capables -23275 +▁desertec -23276 +▁halalaya -23277 +▁kalafliw -23278 +▁kalansen -23279 +▁kɔrɔbalɛ -23280 +▁nɔgɔlenw -23281 +repubulika -23282 +▁bitikibaw -23283 +▁funansere -23284 +▁ocellifer -23285 +▁sinsinikɛ -23286 +▁toumagnon -23287 +▁wasadenya -23288 +▁wɔlɔbugun -23289 +▁yaranango -23290 +▁yarjejeni -23291 +▁yiriwalɛn -23292 +▁yomboliba -23293 +▁yorubakan -23294 +▁èzimbabwe -23295 +▁ébranlent -23296 +▁éducation -23297 +▁équilibre -23298 +▁şalpazarı -23299 +jy -23300 +ƙa -23301 +baf -23302 +dgi -23303 +ɛgɔ -23304 +▁ɛɛ -23305 +atro -23306 +kɔgɔ -23307 +mkpọ -23308 +nier -23309 +vina -23310 +▁ley -23311 +▁oum -23312 +▁ɛɛà -23313 +bodgi -23314 +ferus -23315 +ɛgɔda -23316 +▁bɔlɔ -23317 +▁cath -23318 +▁jani -23319 +▁kane -23320 +▁meng -23321 +▁mest -23322 +▁node -23323 +▁reto -23324 +▁tise -23325 +baflaw -23326 +kalash -23327 +kɔgɔji -23328 +nadosi -23329 +umanya -23330 +▁alaƙa -23331 +▁barth -23332 +▁diati -23333 +▁doual -23334 +▁furmi -23335 +▁harve -23336 
+▁leyre -23337 +▁olasa -23338 +▁oumou -23339 +▁sagar -23340 +▁sutan -23341 +▁tataw -23342 +ejikọta -23343 +kolonbu -23344 +▁boliso -23345 +▁bozola -23346 +▁bɔlɔɔn -23347 +▁harvey -23348 +▁masana -23349 +▁morgan -23350 +▁mumbai -23351 +▁pepper -23352 +▁sinɔgɔ -23353 +▁teatro -23354 +akwalite -23355 +lawirisi -23356 +▁alcinus -23357 +▁bakongo -23358 +▁catholi -23359 +▁corvina -23360 +▁fangaba -23361 +▁furmien -23362 +▁kôrôlen -23363 +▁mengata -23364 +▁rations -23365 +▁sesotho -23366 +▁signier -23367 +ganiɛgɔda -23368 +▁anglekan -23369 +▁ateliers -23370 +▁bartholo -23371 +▁karthala -23372 +▁lafiyale -23373 +▁medellín -23374 +▁moolaadé -23375 +▁nielbank -23376 +▁sulaiman -23377 +▁sutanama -23378 +▁wɔɔrɔnan -23379 +bolawirisi -23380 +▁barnadosi -23381 +▁diatiminè -23382 +▁duruhttps -23383 +▁fasjamana -23384 +▁furmientu -23385 +▁mengatasi -23386 +▁ɲaamɛŋɔni -23387 +▁ɲeshinnen -23388 +▁ɲininkali -23389 +▁ɲɔgɔnforo -23390 +▁ɲɛblalila -23391 +▁ɳakuntlen -23392 +▁навальной -23393 +▁силовикам -23394 +▁установил -23395 +▁федерация -23396 +▁художницу -23397 +▁ценникахв -23398 +▁الإسلامية -23399 +,' -23400 +ߏ߬ -23401 +▁מ -23402 +odo -23403 +èri -23404 +▁—, -23405 +bosa -23406 +itin -23407 +piye -23408 +urse -23409 +▁dio -23410 +▁kol -23411 +chimi -23412 +doodo -23413 +intra -23414 +tièri -23415 +▁ante -23416 +▁diai -23417 +▁feya -23418 +▁gaza -23419 +▁glan -23420 +▁koin -23421 +▁mime -23422 +▁miss -23423 +▁nate -23424 +▁plum -23425 +▁walɛ -23426 +▁well -23427 +▁тера -23428 +▁ịkwa -23429 +fourou -23430 +lobosa -23431 +ngiran -23432 +waitin -23433 +▁abdal -23434 +▁franc -23435 +▁ganbe -23436 +▁koinè -23437 +▁kolsi -23438 +▁nurse -23439 +▁també -23440 +▁vɔtɔw -23441 +ampione -23442 +chimiki -23443 +dɔnniya -23444 +kuranta -23445 +▁bɛnnin -23446 +▁cintra -23447 +▁diouna -23448 +▁feyase -23449 +▁jolibɔ -23450 +▁minani -23451 +▁papiye -23452 +▁sesoto -23453 +▁weleen -23454 +▁banbaga -23455 +▁kpatara -23456 +▁missing -23457 +▁niarela -23458 +▁nyamasa -23459 +▁plumata -23460 +▁samassa 
-23461 +▁sanfeda -23462 +▁toranen -23463 +▁tugulen -23464 +▁tugulɛw -23465 +▁ƙirƙira -23466 +akwadoghị -23467 +champione -23468 +salpazari -23469 +▁chimique -23470 +▁culturel -23471 +▁diaikite -23472 +▁frédéric -23473 +▁tambédou -23474 +èchampione -23475 +▁algazella -23476 +▁banbagaci -23477 +▁biglobosa -23478 +▁demisenya -23479 +▁farikoloj -23480 +▁jikuranta -23481 +▁konfourou -23482 +▁ɲɔgɔnfaga -23483 +▁الجزائرية -23484 +▁اللبنانية -23485 +▁مصرالعربي -23486 +▁ߖߘߍ߬ߡߊ߬ߖߌ -23487 +▁ߞߊ߬ߙߊ߲߬ߓߊ -23488 +adricinctus -23489 +agriculture -23490 +akpatụbeghị -23491 +amayalakali -23492 +arepubliken -23493 +association -23494 +bakɔrɔnkuru -23495 +balikukalan -23496 +bolibatolaw -23497 +centralized -23498 +ekwuchitere -23499 +ym -23500 +▁# -23501 +▁ߙ -23502 +ndị -23503 +tim -23504 +▁mā -23505 +arit -23506 +gɔɔn -23507 +keda -23508 +lɛrɔ -23509 +pony -23510 +seen -23511 +vezo -23512 +▁cun -23513 +▁dac -23514 +▁eun -23515 +▁iwu -23516 +bange -23517 +dakar -23518 +soles -23519 +▁cɛnt -23520 +▁etym -23521 +▁haɗi -23522 +▁iris -23523 +▁jiya -23524 +▁jubɔ -23525 +▁npan -23526 +▁saka -23527 +▁somo -23528 +▁togu -23529 +ranéen -23530 +▁dacko -23531 +▁damba -23532 +▁ghọta -23533 +▁mvezo -23534 +▁mārga -23535 +▁nyɛfô -23536 +▁sabaa -23537 +▁sogow -23538 +▁somos -23539 +▁tanga -23540 +▁trais -23541 +▁bɛlɛrɔ -23542 +▁cakeda -23543 +▁cogomi -23544 +▁jatela -23545 +▁jiyabe -23546 +▁jusigi -23547 +▁muanda -23548 +▁mɔgaya -23549 +▁ngurun -23550 +▁police -23551 +▁sutara -23552 +▁terror -23553 +ological -23554 +▁damanas -23555 +▁diakite -23556 +▁gbadara -23557 +▁gɔngɔɔn -23558 +▁liquide -23559 +▁atụnyere -23560 +▁bamabara -23561 +▁consoles -23562 +▁jusigira -23563 +▁nônôkènè -23564 +▁présenté -23565 +▁sankaran -23566 +▁bolimafɛn -23567 +▁kunkuruun -23568 +▁magoqwana -23569 +▁squamosal -23570 +▁tamkharit -23571 +▁tiamantiɛ -23572 +erianijeria -23573 +expositions -23574 +fangajamana -23575 +ganmarayɔrɔ -23576 +giosprinter -23577 +gɔnbailleul -23578 +hemorrhoids -23579 +herzégovine -23580 
+infographic -23581 +ingüísticos -23582 +inibailleul -23583 +iridescence -23584 +iserepublic -23585 +iśtirakiyah -23586 +jelinkusuun -23587 +jovaciennes -23588 +kansurunnin -23589 +korobɔrɔkan -23590 +laedefabrik -23591 +libreoffice -23592 +lɛkisandiri -23593 +mandingokan -23594 +missirikoro -23595 +monteaguila -23596 +mototakisiw -23597 +nisenutigiw -23598 +politanisms -23599 +pr -23600 +vw -23601 +yè -23602 +doe -23603 +kie -23604 +mok -23605 +▁fm -23606 +").[ -23607 +anes -23608 +kaya -23609 +▁/// -23610 +▁feɳ -23611 +▁gdi -23612 +▁kaj -23613 +▁kee -23614 +▁rye -23615 +▁vab -23616 +jɛman -23617 +taxis -23618 +unity -23619 +▁anka -23620 +▁ciɲɛ -23621 +▁dɔnw -23622 +▁engy -23623 +▁kada -23624 +▁kajš -23625 +▁kugo -23626 +▁kult -23627 +▁kuta -23628 +▁odoe -23629 +▁taís -23630 +isanes -23631 +moksha -23632 +▁bolow -23633 +▁bosat -23634 +▁chart -23635 +▁sayes -23636 +▁seyba -23637 +▁sisie -23638 +▁slavw -23639 +▁soura -23640 +▁tesis -23641 +feereso -23642 +polskie -23643 +▁badenw -23644 +▁bakers -23645 +▁butiki -23646 +▁feɳama -23647 +▁groupe -23648 +▁jenɛsi -23649 +▁kultur -23650 +▁minɛko -23651 +▁nksiin -23652 +▁nkɔsɔn -23653 +ractions -23654 +▁bɔgɔlan -23655 +▁kɔfɛtaw -23656 +▁minɛtaw -23657 +▁oseania -23658 +▁recolon -23659 +▁sangani -23660 +▁souraka -23661 +▁station -23662 +▁suganti -23663 +▁tissent -23664 +▁fagalenw -23665 +▁faisanes -23666 +▁hippopot -23667 +▁jamboree -23668 +▁kingston -23669 +▁kɛrɛkɛrɛ -23670 +▁miiriyaw -23671 +▁nayasɔrɔ -23672 +▁nijeriya -23673 +▁sɛnɛfenw -23674 +▁vabariik -23675 +▁elizabeti -23676 +▁funankɛya -23677 +▁kulturene -23678 +▁religious -23679 +▁timinandi -23680 +pplications -23681 +proceedings -23682 +realization -23683 +refinitions -23684 +southafrica -23685 +taurotragus -23686 +tikajamhuri -23687 +tikiditunga -23688 +tográfiques -23689 +tophilornis -23690 +udaljenosti -23691 +yiriwasiraw -23692 +yumhūriyyat -23693 +électricité -23694 +équatoriale -23695 +ñèchampione -23696 +ɔribailleul -23697 +григорцевич -23698 +русификация 
-23699 +?" -23700 +lp -23701 +pk -23702 +tị -23703 +wp -23704 +ebi -23705 +hum -23706 +▁dᴐ -23707 +dika -23708 +dolo -23709 +kabu -23710 +tulu -23711 +tura -23712 +▁bih -23713 +▁bɛk -23714 +▁hae -23715 +▁llp -23716 +▁moo -23717 +▁rpk -23718 +▁upo -23719 +itlin -23720 +llman -23721 +▁bola -23722 +▁casi -23723 +▁cuun -23724 +▁deke -23725 +▁dolô -23726 +▁feré -23727 +▁goon -23728 +▁mati -23729 +▁tang -23730 +▁thee -23731 +▁wadu -23732 +▁yapa -23733 +agbatị -23734 +labila -23735 +silama -23736 +▁bioko -23737 +▁dugus -23738 +▁galet -23739 +▁haeun -23740 +▁moves -23741 +▁mɔnni -23742 +▁nahum -23743 +▁silva -23744 +▁sɔnŋo -23745 +▁turai -23746 +▁upolu -23747 +▁yanka -23748 +candace -23749 +dafrica -23750 +sanding -23751 +spécial -23752 +▁casita -23753 +▁duguye -23754 +▁jibɔɔn -23755 +▁kolɛri -23756 +▁latika -23757 +▁matiyu -23758 +▁setịpụ -23759 +▁sutura -23760 +▁sɔnŋoy -23761 +▁toured -23762 +▁waduba -23763 +▁wilili -23764 +▁yèrèma -23765 +arafalen -23766 +bejasson -23767 +terhouse -23768 +▁bollman -23769 +▁caitlin -23770 +▁histori -23771 +▁kastili -23772 +▁kɔnkɛra -23773 +▁lakalan -23774 +▁sarasin -23775 +▁yapaani -23776 +sudafrica -23777 +▁bucorvus -23778 +▁haeundae -23779 +▁itinéran -23780 +▁nolabila -23781 +▁supplied -23782 +▁taniwɔrɔ -23783 +▁wɔlɔkama -23784 +▁ameridika -23785 +▁gɛlɛmanba -23786 +▁karagnara -23787 +▁kôdjalada -23788 +▁lakɔlisow -23789 +▁taamacogo -23790 +▁ybejasson -23791 +orobailleul -23792 +спитанников -23793 +▁accredited -23794 +▁accélérées -23795 +▁africaines -23796 +▁aglomerasi -23797 +▁alimentent -23798 +▁anthreptes -23799 +/( -23800 +qs -23801 +ghz -23802 +▁où -23803 +guns -23804 +oche -23805 +sima -23806 +sosi -23807 +▁bɛr -23808 +▁kil -23809 +▁kɔs -23810 +▁ntɔ -23811 +▁tak -23812 +▁òtù -23813 +chewa -23814 +inɛka -23815 +sénou -23816 +unizi -23817 +▁deni -23818 +▁jèli -23819 +▁kome -23820 +▁wits -23821 +▁yuli -23822 +amaara -23823 +routel -23824 +tigiko -23825 +tunizi -23826 +▁djene -23827 +▁finis -23828 +▁minna -23829 +▁nsonw -23830 
+▁scran -23831 +▁taale -23832 +▁tunun -23833 +▁unani -23834 +sènbɔli -23835 +transla -23836 +▁autour -23837 +▁brevis -23838 +▁daaman -23839 +▁jinɛka -23840 +▁komedi -23841 +▁kɔsɛbɛ -23842 +▁malien -23843 +▁malila -23844 +▁mamadu -23845 +▁okɔsɔn -23846 +▁papers -23847 +▁taksiw -23848 +▁yonkon -23849 +antioche -23850 +laurence -23851 +soguinex -23852 +sosiyali -23853 +ttemberg -23854 +▁bɛrɛbɛn -23855 +▁djenepo -23856 +▁froutel -23857 +▁jiidili -23858 +▁kiltiri -23859 +▁lajɛbaw -23860 +▁légende -23861 +▁somɔgɔw -23862 +▁kotigiko -23863 +▁province -23864 +▁scranton -23865 +▁sɛbɛnina -23866 +portigikan -23867 +▁anchorage -23868 +▁bɛrɛbɛnna -23869 +▁côkôrôbaw -23870 +▁finyesira -23871 +▁koordinat -23872 +▁laniarius -23873 +▁mananinnc -23874 +▁pygmalion -23875 +▁sigikuluw -23876 +theguardian -23877 +translateur -23878 +▁arabukalan -23879 +▁argentique -23880 +▁arrondisse -23881 +▁artbreeder -23882 +▁astronomie -23883 +▁atlantique -23884 +▁baarakɛnaf -23885 +▁baarakɛtaw -23886 +▁bagabagali -23887 +▁bamanjamuw -23888 +▁banaɲaɲini -23889 +▁bangalades -23890 +▁barakɛlenw -23891 +▁benjervili -23892 +▁bidorsalis -23893 +▁biduurunan -23894 +▁bilisaɲami -23895 +▁binganinaw -23896 +▁biologique -23897 +▁biribiriba -23898 +▁biwolofila -23899 +دن -23900 +مد -23901 +وغ -23902 +َو -23903 +ߍ߲ -23904 +▁ߡ -23905 +▁ߦ -23906 +▁朝 -23907 +meo -23908 +ída -23909 +ردن -23910 +هَو -23911 +ߣߍ߲ -23912 +▁hɔ -23913 +▁ww -23914 +ekew -23915 +nedi -23916 +sajè -23917 +seko -23918 +ߌߣߍ߲ -23919 +▁hbo -23920 +▁won -23921 +▁حمد -23922 +▁هَو -23923 +gagné -23924 +pical -23925 +romeo -23926 +umina -23927 +▁aids -23928 +▁aída -23929 +▁blom -23930 +▁ciin -23931 +▁mena -23932 +▁naba -23933 +▁niag -23934 +▁righ -23935 +anwale -23936 +▁...), -23937 +▁boliw -23938 +▁djiri -23939 +▁hamel -23940 +▁jonya -23941 +▁julie -23942 +▁nkebi -23943 +▁okôrô -23944 +▁phate -23945 +▁rouen -23946 +jermani -23947 +ologila -23948 +▁desiro -23949 +▁doyoro -23950 +▁gassam -23951 +▁guémou -23952 +▁hɔbori -23953 +▁katowi -23954 
+▁konipo -23955 +▁menaka -23956 +▁rights -23957 +▁sidiki -23958 +▁tondon -23959 +dugusajè -23960 +rintugan -23961 +▁alumina -23962 +▁anagram -23963 +▁blombos -23964 +▁foureau -23965 +▁kòsegin -23966 +▁niagami -23967 +▁ntọhapụ -23968 +▁phatell -23969 +▁sistɛmu -23970 +▁sonekew -23971 +▁tuguniw -23972 +▁bamanana -23973 +▁desgagné -23974 +▁eurozone -23975 +▁foureaui -23976 +▁gassamba -23977 +▁katowice -23978 +▁martinez -23979 +▁nabatara -23980 +▁omniglot -23981 +▁shuyaniw -23982 +▁tondonen -23983 +▁tropical -23984 +▁whakaatu -23985 +birintugan -23986 +▁anagramme -23987 +▁jamhuriya -23988 +▁nkebiokwu -23989 +▁ruppellii -23990 +▁tugubagaw -23991 +▁ƙungiyoyi -23992 +▁blockchain -23993 +▁bolocoronw -23994 +▁bolofaraye -23995 +▁bolonobila -23996 +▁bonapartis -23997 +▁bronkhorst -23998 +▁bukantigiw -23999 +tf -24000 +."( -24001 +ath -24002 +ôle -24003 +▁bf -24004 +▁bâ -24005 +▁cf -24006 +▁kb -24007 +▁kù -24008 +arts -24009 +goli -24010 +uses -24011 +valt -24012 +▁ụkọ -24013 +imɔgɔ -24014 +jinân -24015 +liath -24016 +▁ador -24017 +▁conf -24018 +▁haba -24019 +▁jawu -24020 +▁mɛgɛ -24021 +▁nton -24022 +▁pola -24023 +▁rôle -24024 +▁side -24025 +▁tuun -24026 +koloma -24027 +ouloud -24028 +thomas -24029 +▁diabi -24030 +▁dolou -24031 +▁frago -24032 +▁kùran -24033 +▁lomba -24034 +▁minji -24035 +▁polak -24036 +▁yefen -24037 +▁zones -24038 +kananda -24039 +karitɔn -24040 +▁causes -24041 +▁faraku -24042 +▁farine -24043 +▁furajɛ -24044 +▁habaku -24045 +▁jatigɛ -24046 +▁kontao -24047 +▁lombad -24048 +▁majago -24049 +▁makona -24050 +▁rapide -24051 +▁confine -24052 +▁filakan -24053 +▁fragoso -24054 +▁fɔkanna -24055 +▁gobroni -24056 +▁goliath -24057 +▁habakuk -24058 +▁kandake -24059 +▁mɔngoli -24060 +▁neimɔgɔ -24061 +▁nwesịrị -24062 +▁sirabaw -24063 +▁sɛnɛbaw -24064 +▁tulokun -24065 +vekananda -24066 +▁donotulu -24067 +▁lakoloma -24068 +▁maouloud -24069 +▁obscurus -24070 +▁sogoforo -24071 +▁tasavalt -24072 +▁adsimilis -24073 +▁danfarali -24074 +▁datugulan -24075 +▁dorokolen -24076 
+▁fɔlɔmɔgɔw -24077 +▁katedrali -24078 +▁lombadria -24079 +▁montagnon -24080 +▁bundibugyo -24081 +▁buraburaba -24082 +▁bɔbailleul -24083 +▁bɛrɛsunuya -24084 +▁californie -24085 +▁camouflage -24086 +▁cantonment -24087 +▁caractères -24088 +▁castellano -24089 +▁catholique -24090 +▁changeants -24091 +▁chitumbuka -24092 +▁cincinnati -24093 +▁clairvoyan -24094 +▁compartido -24095 +▁compostela -24096 +▁conciencia -24097 +▁conclusion -24098 +▁conference -24099 +red -24100 +stg -24101 +voz -24102 +▁jô -24103 +▁mp -24104 +▁må -24105 +▁nê -24106 +egbu -24107 +ginɛ -24108 +mman -24109 +nôgô -24110 +orje -24111 +pslf -24112 +sɛnɛ -24113 +tzer -24114 +yesu -24115 +▁bɛo -24116 +▁ida -24117 +▁izh -24118 +▁kay -24119 +▁kaz -24120 +▁yin -24121 +akọwa -24122 +lalen -24123 +mmanụ -24124 +talen -24125 +ọpụrụ -24126 +▁alha -24127 +▁bɛbɔ -24128 +▁dɛbɛ -24129 +▁mill -24130 +fɔyɔrɔ -24131 +nôgôya -24132 +witzer -24133 +▁bacon -24134 +▁diama -24135 +▁idaha -24136 +▁izhma -24137 +▁mural -24138 +▁preto -24139 +▁stede -24140 +▁super -24141 +landugu -24142 +malaria -24143 +vinisme -24144 +▁acacia -24145 +▁belize -24146 +▁donnin -24147 +▁gɛtɛrɛ -24148 +▁kazali -24149 +▁kitara -24150 +▁laginɛ -24151 +▁servoz -24152 +▁sɛnɛna -24153 +▁sọpụrụ -24154 +▁taanen -24155 +▁talent -24156 +▁téliya -24157 +dugumada -24158 +▁alhakin -24159 +▁barbara -24160 +▁cemajan -24161 +▁columba -24162 +▁djallon -24163 +▁izhmash -24164 +▁jurakan -24165 +▁senumaw -24166 +▁songhoy -24167 +▁stedeli -24168 +▁switzer -24169 +sɛnɛyɔrɔw -24170 +▁dɔgɔmanw -24171 +▁gaborone -24172 +▁jamakulu -24173 +▁kazalika -24174 +▁lablalen -24175 +▁pentalen -24176 +▁gambensis -24177 +▁herpesles -24178 +▁hɔrɔnyali -24179 +▁kọwachara -24180 +▁laghafoli -24181 +▁ounjougou -24182 +▁pretorius -24183 +▁stedelijk -24184 +▁tarihinta -24185 +▁vizcounty -24186 +▁applecrest -24187 +▁connection -24188 +▁construite -24189 +▁consultado -24190 +▁containing -24191 +▁convention -24192 +▁cricetomys -24193 +▁crossroads -24194 +▁cucullatus -24195 +▁cɛsirilanw 
-24196 +▁dagamaïssa -24197 +▁daminɛkuma -24198 +▁daminɛyɔrɔ -24199 +"( -24200 +afe -24201 +fal -24202 +sam -24203 +▁ip -24204 +fore -24205 +krou -24206 +mamu -24207 +pies -24208 +rète -24209 +samn -24210 +site -24211 +▁guy -24212 +▁ice -24213 +▁nih -24214 +▁tlo -24215 +▁tom -24216 +arian -24217 +crète -24218 +diatɛ -24219 +kiban -24220 +quées -24221 +▁anga -24222 +▁bian -24223 +▁gụrụ -24224 +▁host -24225 +▁kɔɔn -24226 +▁tiga -24227 +▁ɲafe -24228 +▁الله -24229 +amanɔn -24230 +banchi -24231 +before -24232 +bluesz -24233 +falgar -24234 +fɔlanw -24235 +songon -24236 +▁apies -24237 +▁bangɛ -24238 +▁basum -24239 +▁bɛɛla -24240 +▁ellen -24241 +▁fémin -24242 +▁kèlaw -24243 +▁kɔron -24244 +▁lepen -24245 +▁songô -24246 +▁tilsi -24247 +▁urząd -24248 +▁walas -24249 +▁yukan -24250 +akacala -24251 +intaran -24252 +kamalen -24253 +pogolon -24254 +quarian -24255 +▁bianca -24256 +▁dɛkrou -24257 +▁labana -24258 +▁nasara -24259 +▁patrie -24260 +▁saraba -24261 +▁songôw -24262 +▁tilsit -24263 +▁alimamu -24264 +▁bodiatɛ -24265 +▁codiuku -24266 +▁diyenin -24267 +▁dugukol -24268 +▁kɛlɛnna -24269 +▁makiban -24270 +▁mallaka -24271 +▁métiers -24272 +▁nkalama -24273 +▁santiri -24274 +▁semitor -24275 +▁website -24276 +▁discrète -24277 +▁dugukolw -24278 +▁ebolatɔw -24279 +▁ethiopia -24280 +▁fangabaw -24281 +▁féminine -24282 +▁marquées -24283 +▁portland -24284 +▁ɲintaran -24285 +kùnnàkalan -24286 +▁antologie -24287 +▁bikɔnɔtɔn -24288 +▁enhaipeun -24289 +▁jɛkɔnɔnin -24290 +▁santiriba -24291 +▁semitorqu -24292 +▁trafalgar -24293 +antiquarian -24294 +▁danbetigiw -24295 +▁dandéresso -24296 +▁dangifalle -24297 +▁dankanbolo -24298 +▁dannaselen -24299 +": -24300 +yb -24301 +did -24302 +eli -24303 +eng -24304 +rew -24305 +wro -24306 +▁aś -24307 +▁cj -24308 +asie -24309 +cson -24310 +▁alu -24311 +▁dal -24312 +▁ici -24313 +engdu -24314 +faraf -24315 +wrold -24316 +yeeli -24317 +▁beyi -24318 +▁bile -24319 +▁drew -24320 +▁dura -24321 +▁haki -24322 +▁ikwu -24323 +▁jagu -24324 +▁jake -24325 +▁tapo -24326 
+▁tedɔ -24327 +bobaga -24328 +bɔyɔrɔ -24329 +karaan -24330 +maliza -24331 +wroldl -24332 +▁alube -24333 +▁ampat -24334 +▁gadir -24335 +▁jɔlan -24336 +▁kolen -24337 +▁laala -24338 +▁leral -24339 +▁metre -24340 +▁tradi -24341 +▁waabɔ -24342 +llinula -24343 +▁bafila -24344 +▁dallas -24345 +▁fralen -24346 +▁jaguar -24347 +▁janata -24348 +▁joseon -24349 +▁kɛlɛya -24350 +▁meteri -24351 +▁nleban -24352 +▁tucson -24353 +▁yenmin -24354 +▁alubetu -24355 +▁chengdu -24356 +▁minyɔrɔ -24357 +▁mungala -24358 +▁sonsaan -24359 +▁swedish -24360 +▁sɔrɔbaw -24361 +▁tɔrɔtaw -24362 +▁ɲangata -24363 +compagnie -24364 +▁erɔpukaw -24365 +▁hakilima -24366 +▁laghachi -24367 +▁laissant -24368 +▁nlebanya -24369 +▁tjikouna -24370 +malización -24371 +▁batensoda -24372 +▁delagrave -24373 +▁gallinula -24374 +▁kakoulima -24375 +▁sankaraan -24376 +▁ɲangataan -24377 +awirilikalo -24378 +▁biscutatus -24379 +▁deliciosus -24380 +▁denmisɛniw -24381 +▁dependenci -24382 +▁desebagato -24383 +▁devanāgarī -24384 +▁dictionary -24385 +▁différence -24386 +▁différente -24387 +▁dignitaire -24388 +▁diyarbakır -24389 +▁djoungonda -24390 +▁dofɛrɛtɛda -24391 +▁domesticus -24392 +▁donɲwanakɛ -24393 +▁doublement -24394 +▁dramatique -24395 +▁dugumayɔrɔ -24396 +▁définitive -24397 +▁développer -24398 +▁dɔkilibala -24399 +bat -24400 +era -24401 +leh -24402 +mau -24403 +swe -24404 +łki -24405 +как -24406 +atɔn -24407 +kowi -24408 +shan -24409 +sity -24410 +soni -24411 +ûtra -24412 +▁aba -24413 +▁ble -24414 +▁cav -24415 +▁ero -24416 +▁lah -24417 +kokan -24418 +kowie -24419 +swela -24420 +sûtra -24421 +verso -24422 +▁baki -24423 +▁bern -24424 +▁bèla -24425 +▁fark -24426 +▁kale -24427 +▁kuko -24428 +▁laba -24429 +▁pape -24430 +▁shuu -24431 +▁tlon -24432 +▁wugu -24433 +amatɔn -24434 +atimes -24435 +kariti -24436 +maures -24437 +shangu -24438 +yirika -24439 +▁abaja -24440 +▁bougô -24441 +▁desse -24442 +▁katié -24443 +▁kongô -24444 +▁kotor -24445 +▁maera -24446 +▁njikọ -24447 +▁npaan -24448 +▁rabat -24449 +▁saleh -24450 +▁seyne 
-24451 +rakowie -24452 +▁aragon -24453 +▁bannen -24454 +▁bleble -24455 +▁caiman -24456 +▁dugugi -24457 +▁estate -24458 +▁falaan -24459 +▁jakhan -24460 +▁leones -24461 +▁médina -24462 +▁ntɛfɛn -24463 +▁roisin -24464 +▁sengor -24465 +▁thenia -24466 +baptiste -24467 +ispaniya -24468 +shanguve -24469 +▁abajada -24470 +▁aleksey -24471 +▁animali -24472 +▁bernard -24473 +▁density -24474 +▁dugulen -24475 +▁kantigi -24476 +▁katiéna -24477 +▁martian -24478 +▁shirley -24479 +▁waïgalo -24480 +worldnews -24481 +▁bayirika -24482 +▁eritreya -24483 +▁halakili -24484 +▁jakhanke -24485 +▁krakowie -24486 +▁rzymełki -24487 +▁botsiwana -24488 +▁mainugnai -24489 +▁orchestré -24490 +▁petherici -24491 +▁récemment -24492 +▁sinamatɔn -24493 +▁sukaradon -24494 +ispaniyakan -24495 +▁dɔkɔtɔrɔya -24496 +▁dɛgɛyɔrɔba -24497 +▁electricus -24498 +▁endlicheri -24499 +td -24500 +feb -24501 +yat -24502 +ɔna -24503 +▁(* -24504 +basi -24505 +geti -24506 +jiki -24507 +zion -24508 +▁hes -24509 +▁igè -24510 +fiɲɛw -24511 +▁dabe -24512 +▁douz -24513 +▁emee -24514 +▁fola -24515 +▁göre -24516 +▁jiin -24517 +▁kone -24518 +▁niɔn -24519 +▁romu -24520 +yevsky -24521 +▁falan -24522 +▁faral -24523 +▁folaw -24524 +▁kuyat -24525 +▁laben -24526 +▁niafo -24527 +▁peulh -24528 +▁tyran -24529 +▁upper -24530 +▁yahoo -24531 +kɔnɔtɔn -24532 +zionale -24533 +ération -24534 +▁dageti -24535 +▁dôgôya -24536 +▁foloye -24537 +▁görele -24538 +▁hajida -24539 +▁hester -24540 +▁lamɔna -24541 +▁mabɔli -24542 +▁morala -24543 +▁morisi -24544 +▁vinsan -24545 +▁zimbab -24546 +eswatini -24547 +toyevsky -24548 +▁beljiki -24549 +▁dabelen -24550 +▁kaikosi -24551 +▁kenneth -24552 +▁seconde -24553 +bikɔnɔtɔn -24554 +stoyevsky -24555 +▁cambodia -24556 +▁colonies -24557 +▁jalakoro -24558 +▁morisius -24559 +▁sanfɛkan -24560 +▁thiocary -24561 +▁transfer -24562 +▁beganmara -24563 +▁nazionale -24564 +▁pluvianus -24565 +▁vincennes -24566 +▁yɛrɛtagan -24567 +▁zimbabbwe -24568 +inabailleul -24569 +▁autochtone -24570 +▁denmisɛnya -24571 +▁department 
-24572 +▁entreprise -24573 +▁enwechaghị -24574 +▁erythropus -24575 +▁ethnologue -24576 +▁excellence -24577 +▁exposition -24578 +▁falenfalen -24579 +▁falikɛwulu -24580 +▁familiaris -24581 +▁farakoloci -24582 +▁farakɔrɔba -24583 +▁faransekan -24584 +▁farikoloma -24585 +▁fasɔrɔsira -24586 +▁febuyekalo -24587 +▁fellowship -24588 +▁filimukɛla -24589 +▁finlandfin -24590 +▁flanflanko -24591 +▁forestiers -24592 +▁forkjelige -24593 +▁forobacako -24594 +▁fugulablen -24595 +▁funankɛniw -24596 +▁furuɲwanma -24597 +▁fôlôbugula -24598 +▁fɔnɛtigima -24599 +bta -24600 +ibi -24601 +rer -24602 +tof -24603 +unh -24604 +▁(" -24605 +▁pv -24606 +anac -24607 +asar -24608 +chou -24609 +quer -24610 +yafi -24611 +▁día -24612 +▁nai -24613 +▁pvt -24614 +▁soa -24615 +▁ịlụ -24616 +anaba -24617 +blara -24618 +innpe -24619 +toffe -24620 +vella -24621 +▁fada -24622 +▁jonw -24623 +▁kaye -24624 +▁nuwa -24625 +▁robo -24626 +▁suba -24627 +▁zebu -24628 +buquer -24629 +samuya -24630 +▁alima -24631 +▁atman -24632 +▁canac -24633 +▁delta -24634 +▁dicko -24635 +▁dolen -24636 +▁gérer -24637 +▁maria -24638 +▁nabta -24639 +▁naija -24640 +▁sabuw -24641 +▁savai -24642 +▁sensu -24643 +entente -24644 +mivella -24645 +unhuman -24646 +▁gredos -24647 +▁itinye -24648 +▁makoɲa -24649 +▁mantra -24650 +▁musoko -24651 +▁nègèso -24652 +▁saloum -24653 +▁sumano -24654 +▁torres -24655 +▁welela -24656 +▁yayata -24657 +▁étoffe -24658 +banweela -24659 +▁amaokwu -24660 +▁karbala -24661 +▁naijaha -24662 +▁nkobaan -24663 +▁oriolus -24664 +▁pathfin -24665 +▁yaalata -24666 +buquerque -24667 +▁dumanaba -24668 +▁insulasi -24669 +▁kɔninnpe -24670 +▁kɛlɛdenw -24671 +▁yayatawa -24672 +▁cartouche -24673 +▁comivella -24674 +▁kalangafɛ -24675 +▁makoɲafin -24676 +▁naijahall -24677 +▁radcliffe -24678 +▁setanburu -24679 +▁shilatunu -24680 +▁agbanweela -24681 +▁bellicosus -24682 +▁dugubakɔnɔ -24683 +▁fɛnɲɛnamaw -24684 +▁gallerella -24685 +▁generating -24686 +▁gengerenin -24687 +▁geografski -24688 +▁gibraltari -24689 +▁glaucidium -24690 
+▁gnèmogobaw -24691 +▁graphiques -24692 +▁greensboro -24693 +▁grenadiniw -24694 +▁guinéegine -24695 +▁gundolakow -24696 +▁gundolatɔn -24697 +▁gymnarchus -24698 +▁gèrègèniya -24699 +nd -24700 +dem -24701 +enc -24702 +whi -24703 +ɔro -24704 +ива -24705 +cyan -24706 +dali -24707 +daro -24708 +kdem -24709 +sron -24710 +télé -24711 +ɲana -24712 +▁iii -24713 +▁nyu -24714 +▁scs -24715 +▁tld -24716 +alien -24717 +encée -24718 +lease -24719 +which -24720 +ysage -24721 +▁gɔnw -24722 +▁isth -24723 +▁jomo -24724 +▁seki -24725 +▁téli -24726 +▁yɔro -24727 +hawara -24728 +▁bolen -24729 +▁cilen -24730 +▁dôgôt -24731 +▁gnèmo -24732 +▁minan -24733 +▁otélé -24734 +▁rodri -24735 +▁scops -24736 +▁tanpa -24737 +▁cumber -24738 +▁jɛmanw -24739 +▁kidali -24740 +▁miniko -24741 +▁minkɔn -24742 +▁monaco -24743 +▁nyuwan -24744 +▁tikdem -24745 +▁walaan -24746 +▁архива -24747 +́шникова -24748 +▁batiguè -24749 +▁bolendo -24750 +▁dumuniw -24751 +▁gnèmoko -24752 +▁isthmus -24753 +▁lalande -24754 +▁nɔnkɔɔn -24755 +▁paysage -24756 +▁rodrigu -24757 +▁thomson -24758 +▁tianjin -24759 +▁timboté -24760 +▁ɲɛmaaya -24761 +ударствен -24762 +▁clochard -24763 +▁dibimanw -24764 +▁dôgôtôrô -24765 +▁dɔnnifɛn -24766 +▁kamasron -24767 +▁muhawara -24768 +▁nyuwanna -24769 +▁surafana -24770 +▁teliyaba -24771 +▁tilacogo -24772 +▁wolodugu -24773 +niallmccar -24774 +сударствен -24775 +▁dumunifɛn -24776 +▁korolenba -24777 +▁maɲambugu -24778 +▁rodrigues -24779 +▁solarpunk -24780 +▁taaninani -24781 +▁warijashi -24782 +▁ƙwararrun -24783 +ала́шникова -24784 +▁cumberland -24785 +▁gouéléyama -24786 +▁gɛrɛntɛlen -24787 +▁hadamdenya -24788 +▁hakilimaya -24789 +▁harmagedɔn -24790 +▁hassaniyya -24791 +▁hasselblad -24792 +▁hispanyolo -24793 +▁historique -24794 +▁hypostases -24795 +▁hɔrɔnyalen -24796 +▁igbineweka -24797 +▁importante -24798 +▁incluyendo -24799 +cma -24800 +get -24801 +cmac -24802 +difi -24803 +mais -24804 +reli -24805 +varo -24806 +ɛnna -24807 +▁cma -24808 +▁gré -24809 +▁ier -24810 +▁ịkọ -24811 +bemba -24812 +difié 
-24813 +dolus -24814 +donta -24815 +grans -24816 +varoš -24817 +ɔrɔfi -24818 +▁alde -24819 +▁enzo -24820 +▁ghọọ -24821 +▁gnèn -24822 +▁jeni -24823 +▁kote -24824 +▁saye -24825 +across -24826 +emecha -24827 +nances -24828 +▁autre -24829 +▁diaɲa -24830 +▁foncé -24831 +▁innaf -24832 +▁jɛman -24833 +▁liens -24834 +▁mayen -24835 +▁minèn -24836 +▁nikan -24837 +▁nwata -24838 +▁pagna -24839 +▁taaɲɛ -24840 +finkolo -24841 +kalanko -24842 +▁bidenw -24843 +▁damani -24844 +▁docmac -24845 +▁dumais -24846 +▁innafo -24847 +▁kartaj -24848 +▁sennin -24849 +▁sontag -24850 +▁target -24851 +▁العظمى -24852 +religion -24853 +republik -24854 +xondonta -24855 +ɔrɔfilen -24856 +▁babemba -24857 +▁codifié -24858 +▁jumɛfin -24859 +▁lenasia -24860 +▁migrans -24861 +▁montana -24862 +▁nubicus -24863 +▁thienta -24864 +sittacula -24865 +ternances -24866 +▁binanani -24867 +▁byzatine -24868 +▁dakɔrɔta -24869 +▁guttural -24870 +▁kononana -24871 +▁saralenw -24872 +▁sigasiga -24873 +▁troglody -24874 +▁bugulakaw -24875 +▁kartajena -24876 +▁sɛbɛnɛnna -24877 +▁waribonba -24878 +▁étonnante -24879 +▁guimbayara -24880 +▁industrial -24881 +▁influencée -24882 +▁inhalation -24883 +▁institutum -24884 +▁intemporel -24885 +▁interarmes -24886 +▁intramural -24887 +▁introducci -24888 +▁intrépides -24889 +▁invincible -24890 +▁isakadiinɛ -24891 +▁ispanyikan -24892 +▁italiyanci -24893 +▁iterambere -24894 +▁jagorancin -24895 +▁jamhuriyar -24896 +▁janganmina -24897 +▁jatebaliya -24898 +▁jatebɔcogo -24899 +!). -24900 +)). -24901 +tov -24902 +”). 
-24903 +ahịa -24904 +dean -24905 +riki -24906 +toto -24907 +yade -24908 +zari -24909 +▁lhu -24910 +▁moi -24911 +▁uto -24912 +▁wto -24913 +▁xpo -24914 +areid -24915 +digèn -24916 +mucus -24917 +ɔnɔmɛ -24918 +▁bede -24919 +▁dowu -24920 +▁kete -24921 +▁kode -24922 +▁kôso -24923 +▁rpgw -24924 +▁timɛ -24925 +▁tɛdɔ -24926 +▁ɲiɲi -24927 +accent -24928 +bawtun -24929 +vriers -24930 +▁banbo -24931 +▁banin -24932 +▁briki -24933 +▁dinɛw -24934 +▁fɔtaw -24935 +▁lover -24936 +▁masan -24937 +▁minɛɛ -24938 +▁santo -24939 +▁tɔgɔo -24940 +▁woman -24941 +▁xposu -24942 +▁yonha -24943 +▁ɲɔrɔn -24944 +yadeles -24945 +▁andean -24946 +▁boyana -24947 +▁caleya -24948 +▁german -24949 +▁laburu -24950 +▁marale -24951 +▁môbili -24952 +▁pareid -24953 +▁siraan -24954 +▁sumanw -24955 +▁traorè -24956 +▁yonhap -24957 +▁ɲiɲila -24958 +kọpụtara -24959 +tɛrɔnɔmɛ -24960 +▁bayanan -24961 +▁cissoko -24962 +▁germany -24963 +▁kɔrzari -24964 +▁masanta -24965 +▁mmelite -24966 +▁saratov -24967 +▁xposure -24968 +manbawtun -24969 +▁farafinw -24970 +▁janamanw -24971 +▁lohoroma -24972 +▁marakɔrɔ -24973 +▁ouvriers -24974 +lasigidenw -24975 +uetersenro -24976 +▁akọpụtara -24977 +▁baninkɔnɔ -24978 +▁noyadeles -24979 +▁saniyalen -24980 +▁tigitigiw -24981 +musokôrôbaw -24982 +▁belaruskaw -24983 +▁dutɛrɔnɔmɛ -24984 +▁jatigiyake -24985 +▁jerenkeren -24986 +▁jidagayɔrɔ -24987 +▁jingoistic -24988 +▁jiriboloda -24989 +▁jisigiyɔrɔ -24990 +▁jogoɲumaya -24991 +▁journalist -24992 +▁jɛkukuwkan -24993 +▁jɛkulukono -24994 +▁kafaraokan -24995 +▁kalansobaw -24996 +▁kamiandugu -24997 +▁kanhɔnrɔya -24998 +▁karabentao -24999 +ebe -25000 +rwa -25001 +āja -25002 +ịde -25003 +▁"' -25004 +▁vu -25005 +bɔra -25006 +liwa -25007 +robe -25008 +wain -25009 +wuru -25010 +ọhịa -25011 +▁bwa -25012 +▁ɲɛw -25013 +donso -25014 +hamma -25015 +nkulu -25016 +ɔnɔbɔ -25017 +▁fɛre -25018 +▁guda -25019 +▁horn -25020 +▁jada -25021 +▁kajɔ -25022 +▁kebe -25023 +▁kewa -25024 +▁kowa -25025 +▁labi -25026 +▁nèrè -25027 +▁oena -25028 +▁puru -25029 +▁rāja -25030 
+▁tewu -25031 +▁tolo -25032 +▁wuru -25033 +fariya -25034 +kununi -25035 +mekalo -25036 +rwalen -25037 +tetiki -25038 +▁durun -25039 +▁faraw -25040 +▁lemma -25041 +▁night -25042 +▁sarov -25043 +▁siglo -25044 +▁tiden -25045 +▁twain -25046 +ardrobe -25047 +▁dhamma -25048 +▁duruna -25049 +▁fagara -25050 +▁kewapụ -25051 +▁kowace -25052 +▁malabo -25053 +▁miniti -25054 +▁musolu -25055 +▁mɔnɔbɔ -25056 +▁nabɔra -25057 +▁sajumɛ -25058 +▁turuyi -25059 +▁waraka -25060 +▁yawuru -25061 +ostralia -25062 +tigininw -25063 +▁armenia -25064 +▁funtira -25065 +▁mainuka -25066 +▁nuwamba -25067 +▁silamen -25068 +▁cɛfariya -25069 +▁dimanche -25070 +▁gônoproj -25071 +▁iteghete -25072 +▁nkwalite -25073 +▁sɔrɔfenw -25074 +▁wardrobe -25075 +▁yiriliwa -25076 +▁yirwalen -25077 +jebailleul -25078 +university -25079 +▁fɛnkununi -25080 +▁jɛkulutɔn -25081 +▁sintetiki -25082 +▁baaraɲᴐgᴐn -25083 +▁damaliscus -25084 +▁jɛkuludenw -25085 +▁karanbagaw -25086 +▁karijakuma -25087 +▁karikatɛri -25088 +▁kartajikaw -25089 +▁kartverket -25090 +▁kassambara -25091 +▁kasuwancin -25092 +▁kasuwannin -25093 +▁kelenyatɔn -25094 +▁kilometres -25095 +▁kilomètèrè -25096 +▁kingsleyae -25097 +▁kinkoumana -25098 +▁kolonkalan -25099 +mị -25100 +] -31835 +я -31836 +ل -31837 ++ -31838 +ь -31839 +% -31840 +ʃ -31841 +б -31842 +ي -31843 +ā -31844 +ч -31845 +ò -31846 +ة -31847 +* -31848 += -31849 +ц -31850 +ر -31851 +ᴐ -31852 +‘ -31853 +م -31854 +! -31855 +· -31856 +í -31857 +ï -31858 +ї -31859 +â -31860 +х -31861 +ú -31862 +ù -31863 +ы -31864 +ф -31865 +ш -31866 +_ -31867 +ж -31868 +و -31869 +? 
-31870 +ߊ -31871 +ƙ -31872 +ю -31873 +̀ -31874 +á -31875 +ɳ -31876 +ó -31877 +ب -31878 +ɗ -31879 +& -31880 +ü -31881 +є -31882 +ì -31883 +ê -31884 +ج -31885 +ë -31886 +ş -31887 +س -31888 +ع -31889 +ن -31890 +ߞ -31891 +ñ -31892 +ه -31893 +ߏ -31894 +ߒ -31895 +߬ -31896 +ī -31897 +ъ -31898 +э -31899 +ت -31900 +د -31901 +ߋ -31902 +ߘ -31903 +߫ -31904 +߲ -31905 +ı -31906 +œ -31907 +ś -31908 +ū -31909 +ߓ -31910 +° -31911 +İ -31912 +ߌ -31913 +ὲ -31914 +ⴰ -31915 +日 -31916 +î -31917 +ö -31918 +́ -31919 +إ -31920 +ش -31921 +ߍ -31922 +ߎ -31923 +‰ -31924 +{ -31925 +ä -31926 +ø -31927 +щ -31928 +י -31929 +् -31930 +ṇ -31931 +ⵜ -31932 +本 -31933 +# -31934 +ã -31935 +û -31936 +ć -31937 +غ -31938 +ك -31939 +ߐ -31940 +ߙ -31941 +ߝ -31942 +ߡ -31943 +社 -31944 +} -31945 +ł -31946 +ũ -31947 +λ -31948 +ѣ -31949 +ئ -31950 +ز -31951 +ߖ -31952 +ߛ -31953 +ߟ -31954 +ߠ -31955 +ߣ -31956 +ߦ -31957 +ध -31958 +म -31959 +ố -31960 +′ -31961 +『 -31962 +』 -31963 +の -31964 +史 -31965 +朝 -31966 +英 -31967 +集 -31968 +$ -31969 +^ -31970 +£ -31971 +× -31972 +å -31973 +ą -31974 +č -31975 +š -31976 +ʻ -31977 +ˈ -31978 +ː -31979 +δ -31980 +σ -31981 +ה -31982 +ו -31983 +ל -31984 +מ -31985 +ר -31986 +ת -31987 +، -31988 +ح -31989 +ص -31990 +ظ -31991 +ق -31992 +ى -31993 +َ -31994 +ग -31995 diff --git a/models/tokenizer/bm_tokenizer_8k.model b/models/tokenizer/bm_tokenizer_8k.model new file mode 100644 index 0000000000000000000000000000000000000000..5c0069a2d5c4ef65c3aeea78b743e31e27bf6933 --- /dev/null +++ b/models/tokenizer/bm_tokenizer_8k.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ebf2d24f769b1286b48c8e35b7389a0e0e1303d97a28ec9d43ae1701d59f89 +size 371453 diff --git a/models/tokenizer/bm_tokenizer_8k.vocab b/models/tokenizer/bm_tokenizer_8k.vocab new file mode 100644 index 0000000000000000000000000000000000000000..71866a1079efd27e447ec08bff248383a62ec411 --- /dev/null +++ b/models/tokenizer/bm_tokenizer_8k.vocab @@ -0,0 +1,8000 @@ + 0 + 0 + 0 + 0 +▁k -0 +an -1 +▁s -2 +▁b -3 +▁d 
-4 +▁n -5 +▁y -6 +▁m -7 +in -8 +▁f -9 +▁ka -10 +la -11 +ar -12 +▁t -13 +▁ye -14 +am -15 +on -16 +en -17 +▁a -18 +li -19 +▁c -20 +ri -21 +▁j -22 +▁la -23 +ti -24 +ba -25 +le -26 +ɔn -27 +gu -28 +go -29 +ya -30 +ra -31 +▁bɛ -32 +ara -33 +ugu -34 +▁ni -35 +un -36 +▁na -37 +▁w -38 +ana -39 +is -40 +▁min -41 +at -42 +ɔr -43 +ɛn -44 +▁ma -45 +▁o -46 +ma -47 +len -48 +re -49 +ani -50 +ko -51 +ka -52 +▁kɛ -53 +▁si -54 +ɔrɔ -55 +si -56 +lo -57 +▁( -58 +▁sa -59 +▁dugu -60 +ro -61 +▁ko -62 +amana -63 +ɔg -64 +▁san -65 +ga -66 +na -67 +rie -68 +il -69 +tion -70 +ama -71 +▁cat -72 +▁ani -73 +égo -74 +égorie -75 +▁catégorie -76 +ou -77 +▁p -78 +di -79 +▁ba -80 +▁don -81 +ni -82 +▁ta -83 +ul -84 +▁jamana -85 +▁di -86 +gi -87 +ɔgɔ -88 +▁h -89 +▁kan -90 +er -91 +▁ɲ -92 +▁u -93 +▁wa -94 +ɛr -95 +▁e -96 +▁i -97 +so -98 +ta -99 +kan -100 +ran -101 +▁saba -102 +▁se -103 +ɔnɔ -104 +da -105 +ogo -106 +bi -107 +▁de -108 +ki -109 +ur -110 +sa -111 +▁fɛ -112 +▁sabab -113 +ari -114 +lan -115 +▁da -116 +oro -117 +▁ch -118 +▁be -119 +▁fɔ -120 +▁g -121 +▁fa -122 +▁kɔ -123 +▁kɔnɔ -124 +es -125 +▁sababou -126 +▁in -127 +▁dɔ -128 +▁ke -129 +▁tun -130 +▁fran -131 +kɛ -132 +iri -133 +les -134 +ɛrɛ -135 +▁bama -136 +te -137 +us -138 +olo -139 +or -140 +▁is -141 +ire -142 +ille -143 +aman -144 +he -145 +▁sɔrɔ -146 +aran -147 +▁ku -148 +▁ti -149 +fɛ -150 +▁é -151 +niya -152 +ɛb -153 +▁bamako -154 +bara -155 +tions -156 +ais -157 +▁franç -158 +bn -159 +ini -160 +bam -161 +▁français -162 +se -163 +▁dic -164 +▁kelen -165 +▁char -166 +▁isbn -167 +▁ha -168 +um -169 +ditions -170 +▁donniya -171 +▁charles -172 +naire -173 +▁diction -174 +baille -175 +bambara -176 +bailleul -177 +▁éditions -178 +▁dictionnaire -179 +ke -180 +den -181 +eri -182 +nu -183 +aransi -184 +▁taa -185 +▁sigi -186 +▁bɔ -187 +▁an -188 +▁man -189 +▁bi -190 +inɛ -191 +▁ji -192 +fa -193 +lɛ -194 +ɲɛ -195 +▁fan -196 +gɛ -197 +▁af -198 +▁minnu -199 +▁mali -200 +ch -201 +mɛ -202 +). 
-203 +to -204 +de -205 +▁v -206 +▁kɔfɛ -207 +▁sira -208 +ji -209 +wa -210 +▁ja -211 +uru -212 +▁ɲɛ -213 +ulu -214 +▁" -215 +ɔrɔn -216 +lu -217 +▁baara -218 +bɔ -219 +ameri -220 +be -221 +jɛ -222 +▁yo -223 +▁mɔgɔ -224 +▁fara -225 +▁kun -226 +▁dan -227 +▁sen -228 +ye -229 +oli -230 +▁caman -231 +dugu -232 +▁mo -233 +wu -234 +ina -235 +ine -236 +ge -237 +▁fi -238 +▁cɛ -239 +ku -240 +▁mara -241 +ca -242 +yɔrɔ -243 +lɔ -244 +▁tɛ -245 +▁. -246 +man -247 +▁kuma -248 +bo -249 +bu -250 +tu -251 +▁faransi -252 +ce -253 +nen -254 +lima -255 +▁yɔrɔ -256 +▁to -257 +me -258 +qu -259 +▁tu -260 +▁dɔn -261 +ne -262 +don -263 +tigi -264 +ɔgɔn -265 +▁jamanaw -266 +px -267 +▁ɛn -268 +▁tɔgɔ -269 +▁woro -270 +▁su -271 +▁yɛ -272 +pa -273 +lon -274 +ent -275 +▁faso -276 +▁gu -277 +gan -278 +▁ameri -279 +▁ca -280 +▁do -281 +▁mu -282 +▁ya -283 +▁kɛra -284 +▁bɛɛ -285 +ɛnɛ -286 +yalen -287 +), -288 +▁worodugu -289 +ci -290 +cogo -291 +we -292 +▁mi -293 +▁nke -294 +▁ọ -295 +hi -296 +kolo -297 +▁fo -298 +▁afri -299 +▁ga -300 +ha -301 +ɛbɛn -302 +▁jon -303 +jamana -304 +▁walima -305 +do -306 +mu -307 +▁ban -308 +fan -309 +▁tle -310 +nan -311 +▁nin -312 +▁kɔrɔ -313 +▁kɛlɛ -314 +▁yɛrɛ -315 +▁so -316 +ban -317 +▁kalan -318 +heli -319 +▁cogo -320 +▁l -321 +tɛr -322 +uni -323 +▁kos -324 +inɛti -325 +▁fanga -326 +▁saheli -327 +tɛrinɛti -328 +ja -329 +wi -330 +▁dugum -331 +▁ɛntɛrinɛti -332 +▁dɛ -333 +▁re -334 +kili -335 +▁dugumogo -336 +▁yooro -337 +▁bo -338 +▁jɛ -339 +yiri -340 +▁fɔlɔ -341 +kun -342 +▁le -343 +ati -344 +▁r -345 +oni -346 +amara -347 +th -348 +yan -349 +▁ɲɔgɔn -350 +ate -351 +▁fana -352 +▁siti -353 +faransi -354 +du -355 +hụ -356 +st -357 +▁bolo -358 +al -359 +rô -360 +▁kon -361 +bin -362 +ɛbɛ -363 +▁z -364 +▁we -365 +▁kelenyalen -366 +ôrô -367 +▁masa -368 +ilan -369 +▁waati -370 +kọ -371 +▁du -372 +▁bon -373 +▁den -374 +▁fasojamana -375 +kɛla -376 +▁mans -377 +gh -378 +▁ki -379 +▁dam -380 +mi -381 +yi -382 +sen -383 +fi -384 +isi -385 +tin -386 +risi -387 +co -388 +▁sugu -389 +▁wala 
-390 +pu -391 +aba -392 +▁co -393 +▁tile -394 +▁jira -395 +▁tlebi -396 +▁mansamara -397 +kɔ -398 +vi -399 +gwu -400 +ɛgɛ -401 +▁wɛrɛ -402 +fin -403 +mɔgɔ -404 +▁me -405 +▁te -406 +denw -407 +▁afrika -408 +pe -409 +ata -410 +▁al -411 +▁ne -412 +▁amerika -413 +po -414 +dɔn -415 +af -416 +▁kɛmɛ -417 +.[ -418 +gin -419 +kulu -420 +▁kosɛbɛ -421 +ve -422 +ter -423 +▁jɔ -424 +▁jo -425 +▁nka -426 +amanan -427 +▁gun -428 +▁li -429 +▁vi -430 +▁tan -431 +▁jate -432 +que -433 +▁faaba -434 +▁sɛbɛn -435 +▁egwu -436 +▁: -437 +tan -438 +▁ci -439 +▁- -440 +▁diɲɛ -441 +fɔ -442 +pi -443 +▁yen -444 +▁walasa -445 +▁bamanan -446 +zi -447 +▁ar -448 +▁of -449 +▁bɔra -450 +yanfan -451 +kụ -452 +▁kè -453 +▁dɔw -454 +fe -455 +amu -456 +kɔnɔ -457 +▁bila -458 +▁bè -459 +ɛna -460 +urun -461 +▁olu -462 +▁kɔrɔn -463 +▁dugukolo -464 +ing -465 +et -466 +▁ro -467 +▁fɛn -468 +▁kɔn -469 +▁hakɛ -470 +mo -471 +▁no -472 +▁po -473 +dị -474 +gô -475 +kalo -476 +▁son -477 +▁kulu -478 +▁yiri -479 +bụ -480 +cɛ -481 +ft -482 +▁ju -483 +ɛrɛn -484 +ariya -485 +▁yoga -486 +as -487 +▁mar -488 +▁kô -489 +▁ali -490 +▁— -491 +tiki -492 +▁tɔn -493 +▁jago -494 +san -495 +iriki -496 +▁uk -497 +▁daminɛ -498 +▁dô -499 +▁afiriki -500 +▁sin -501 +lle -502 +bli -503 +dala -504 +▁bana -505 +▁sababu -506 +▁“ -507 +kɔn -508 +ɛri -509 +▁fô -510 +wift -511 +▁fil -512 +▁mis -513 +ry -514 +▁ŋ -515 +▁aw -516 +uman -517 +▁swift -518 +▁mari -519 +▁bé -520 +tigɛ -521 +▁kɔgɔ -522 +sh -523 +▁jan -524 +▁fila -525 +▁jɛkulu -526 +ôgô -527 +ariku -528 +▁kura -529 +▁tuma -530 +▁wele -531 +▁con -532 +▁pro -533 +▁poli -534 +▁suguya -535 +▁fe -536 +▁tɔ -537 +▁kɛr -538 +▁boli -539 +su -540 +dan -541 +▁dị -542 +kụkọ -543 +▁the -544 +▁bɛna -545 +▁wɛrɛw -546 +▁kɔgɔji -547 +yo -548 +kaw -549 +wan -550 +▁sis -551 +▁kɛnɛ -552 +▁ukra -553 +au -554 +min -555 +fara -556 +jago -557 +▁bin -558 +▁sôrô -559 +▁ɲɛmɔgɔ -560 +▁ɔ -561 +ene -562 +kɔrɔ -563 +▁ce -564 +▁nɔ -565 +▁on -566 +▁muso -567 +▁sɛnɛ -568 +▁dilan -569 +ll -570 +tt -571 +ɲi -572 +ịhụ -573 +▁fari 
-574 +▁bamanankan -575 +ali -576 +gne -577 +nanya -578 +ịhụnanya -579 +▁bu -580 +▁lo -581 +▁des -582 +▁kab -583 +▁с -584 +▁lam -585 +▁sariya -586 +pụ -587 +▁et -588 +baga -589 +▁fin -590 +▁jɛn -591 +je -592 +▁ụ -593 +our -594 +ron -595 +taa -596 +▁franse -597 +εε -598 +▁[ -599 +▁« -600 +ami -601 +ega -602 +fɛn -603 +▁ho -604 +bolo -605 +▁laban -606 +▁hakili -607 +eni -608 +▁ahụ -609 +▁ndị -610 +amerika -611 +ru -612 +ty -613 +té -614 +dio -615 +sin -616 +▁pa -617 +mali -618 +ropa -619 +▁lab -620 +▁foro -621 +▁yiriwa -622 +▁farafin -623 +law -624 +ver -625 +▁naf -626 +ts -627 +ard -628 +dia -629 +▁fu -630 +▁/ -631 +▁at -632 +▁daɲɛ -633 +.. -634 +ww -635 +ere -636 +nin -637 +▁en -638 +▁go -639 +▁yé -640 +▁tra -641 +▁kama -642 +ɔrɔnya -643 +▁senega -644 +▁– -645 +int -646 +son -647 +▁bụ -648 +▁sh -649 +▁wi -650 +ulon -651 +kɛlaw -652 +kɛrɛn -653 +▁siri -654 +▁tariku -655 +▁baarakɛ -656 +▁+ -657 +sia -658 +▁baw -659 +▁dabɔ -660 +▁marifa -661 +rụ -662 +на -663 +▁, -664 +las -665 +bali -666 +jɛgɛ -667 +yali -668 +▁taama -669 +▁kɛmɛda -670 +▁sigilen -671 +rè -672 +che -673 +kow -674 +dama -675 +lenw -676 +▁kolon -677 +▁mɔgɔw -678 +▁sigira -679 +▁ameriki -680 +▁jamanadenw -681 +▁ɛ -682 +pan -683 +▁lu -684 +▁un -685 +▁duni -686 +▁lajɛ -687 +▁laka -688 +▁sila -689 +èn -690 +ск -691 +ena -692 +▁aka -693 +▁gine -694 +ра -695 +ber -696 +▁es -697 +▁wo -698 +▁dun -699 +▁laa -700 +publi -701 +▁cent -702 +▁tugu -703 +dɔnnen -704 +▁kɛrɛn -705 +▁bamakɔ -706 +▁jɔyɔrɔ -707 +▁politiki -708 +▁в -709 +are -710 +baw -711 +naf -712 +▁dé -713 +▁nt -714 +▁ra -715 +land -716 +tara -717 +▁tali -718 +▁wale -719 +▁cogoya -720 +▁masala -721 +kɛrɛnnen -722 +ré -723 +то -724 +mis -725 +▁je -726 +afri -727 +▁mas -728 +▁mili -729 +▁sisan -730 +el -731 +fo -732 +ps -733 +chi -734 +kar -735 +yɛn -736 +▁kaba -737 +▁minɛ -738 +▁site -739 +▁к -740 +jan -741 +res -742 +ton -743 +▁bar -744 +▁bɛn -745 +▁nafa -746 +▁kɛrɛnkɛrɛnnen -747 +ph -748 +ɛni -749 +hara -750 +▁ihe -751 +arabu -752 +bagan -753 +kalan -754 
+▁kɔkan -755 +▁mansa -756 +▁kabini -757 +ck -758 +baa -759 +bia -760 +mba -761 +tra -762 +▁sun -763 +▁fanba -764 +▁tulon -765 +▁kunnaf -766 +▁farafinna -767 +lé -768 +va -769 +ces -770 +cha -771 +lin -772 +mar -773 +tte -774 +▁ale -775 +▁fla -776 +sɛbɛn -777 +▁sika -778 +ال -779 +tik -780 +ment -781 +tali -782 +▁nan -783 +▁hali -784 +▁tila -785 +afrika -786 +▁eropa -787 +▁laadala -788 +▁ịhụnanya -789 +▁jamanaden -790 +kw -791 +▁hi -792 +▁sɛ -793 +bila -794 +▁abụ -795 +▁mun -796 +▁sou -797 +▁cɛma -798 +▁kalo -799 +▁ukraine -800 +ct -801 +tɛ -802 +ɲa -803 +▁л -804 +▁р -805 +babu -806 +sira -807 +▁kar -808 +▁nana -809 +▁yɛlɛ -810 +▁danbɔ -811 +▁irisi -812 +▁sahara -813 +▁sigida -814 +▁kunnafoni -815 +za -816 +rit -817 +èrè -818 +▁sɛb -819 +ugula -820 +ɛnajɛ -821 +▁wari -822 +▁bonya -823 +▁filmu -824 +tɔ -825 +▁; -826 +▁th -827 +▁sam -828 +▁uni -829 +kelen -830 +kɔrɔn -831 +▁fɔli -832 +▁fɛɛrɛ -833 +▁sɛben -834 +▁hadama -835 +▁danfara -836 +по -837 +▁| -838 +liw -839 +ste -840 +tes -841 +uli -842 +ence -843 +lanw -844 +▁lib -845 +▁kilo -846 +▁kolo -847 +▁tiɲɛ -848 +// -849 +vo -850 +▁ʃ -851 +can -852 +mes -853 +ɛlɛ -854 +▁as -855 +▁pe -856 +dasi -857 +fasi -858 +wari -859 +▁ala -860 +▁mon -861 +▁yan -862 +▁ɲin -863 +▁dɔgɔ -864 +▁jugu -865 +▁minu -866 +▁musa -867 +▁jigin -868 +▁saint -869 +kuntigi -870 +:// -871 +ilɛ -872 +tɔn -873 +bola -874 +gera -875 +▁dala -876 +▁tɛmɛ -877 +▁akụkọ -878 +▁faran -879 +▁senkan -880 +▁farikolo -881 +mb -882 +sɛ -883 +des -884 +han -885 +mah -886 +nes -887 +▁nk -888 +▁pi -889 +ania -890 +▁art -891 +▁bam -892 +▁kul -893 +▁par -894 +▁dɛmɛ -895 +▁sini -896 +▁dunia -897 +▁sɔrɔdasi -898 +no -899 +arị -900 +der -901 +▁ex -902 +▁nu -903 +bili -904 +▁hak -905 +donna -906 +mancɛ -907 +tinin -908 +ɛnama -909 +▁kɛɲɛ -910 +▁seko -911 +▁sera -912 +cation -913 +▁atlan -914 +▁kongo -915 +▁foroba -916 +▁fitinin -917 +dɔ -918 +nô -919 +tle -920 +usu -921 +▁am -922 +▁au -923 +▁er -924 +▁gi -925 +buru -926 +sɛgɛ -927 +▁ama -928 +▁jɔn -929 +▁wee -930 +▁fili 
-931 +▁nɛgɛ -932 +▁sara -933 +▁sɛgɛ -934 +▁bagan -935 +▁kungo -936 +▁segin -937 +▁africa -938 +▁nafolo -939 +▁jamanakuntigi -940 +ен -941 +▁* -942 +▁» -943 +lar -944 +yɔn -945 +ɔra -946 +▁fè -947 +paɲi -948 +▁mus -949 +▁tum -950 +▁bara -951 +▁ɛndu -952 +▁ebola -953 +▁galle -954 +▁kɛnɛya -955 +▁sɔrɔko -956 +▁yɛlɛma -957 +▁cɛmancɛ -958 +▁dɔnkili -959 +▁yɛrɛmah -960 +▁madɔnnen -961 +▁sigiyɔrɔ -962 +ho -963 +aka -964 +ben -965 +ger -966 +gon -967 +mɛn -968 +orr -969 +run -970 +sun -971 +tto -972 +urs -973 +▁bô -974 +▁là -975 +▁sé -976 +▁ال -977 +pụta -978 +were -979 +▁and -980 +▁dum -981 +▁for -982 +▁les -983 +▁por -984 +akụkọ -985 +▁jama -986 +▁kara -987 +▁lase -988 +▁mugu -989 +▁sanu -990 +gnette -991 +▁diinɛ -992 +▁kɛcogo -993 +▁masakɛ -994 +". -995 +fu -996 +gɔ -997 +it -998 +ов -999 +dew -1000 +kis -1001 +sis -1002 +sti -1003 +umb -1004 +ɔni -1005 +▁ge -1006 +▁tè -1007 +sion -1008 +tɛrɛ -1009 +▁kala -1010 +▁wati -1011 +orrent -1012 +▁kataa -1013 +▁sudan -1014 +▁woroduguyanfan -1015 +ak -1016 +uk -1017 +▁у -1018 +▁‘ -1019 +ala -1020 +ang -1021 +bur -1022 +ral -1023 +the -1024 +▁ak -1025 +▁el -1026 +ɔnin -1027 +baara -1028 +▁kono -1029 +▁môgô -1030 +tional -1031 +▁arabu -1032 +▁inter -1033 +▁labɛn -1034 +▁surun -1035 +▁ɲuman -1036 +▁kalanso -1037 +▁sirilanw -1038 +▁sɛgɛsɛgɛ -1039 +né -1040 +pp -1041 +ss -1042 +ية -1043 +▁< -1044 +sɛn -1045 +▁qu -1046 +faso -1047 +▁com -1048 +▁shi -1049 +bilen -1050 +ɲɔgɔn -1051 +▁jiri -1052 +▁kore -1053 +▁onye -1054 +▁risi -1055 +▁togo -1056 +▁yoro -1057 +▁dɔnko -1058 +▁hakil -1059 +▁motto -1060 +▁ninnu -1061 +▁silamɛ -1062 +▁faranfasi -1063 +bɛ -1064 +jo -1065 +ld -1066 +fil -1067 +gar -1068 +kon -1069 +ria -1070 +ɔpu -1071 +fina -1072 +jata -1073 +main -1074 +tini -1075 +ɲini -1076 +gharị -1077 +▁dɔrɔn -1078 +▁kulɛri -1079 +▁lakali -1080 +▁ɲinini -1081 +▁dɔnniya -1082 +▁gallery -1083 +▁kumajago -1084 + -7835 +я -7836 +ل -7837 ++ -7838 +ь -7839 +% -7840 +ʃ -7841 +б -7842 +ي -7843 +ā -7844 +ч -7845 +ò -7846 +ة -7847 +* -7848 += 
-7849 +ц -7850 +ر -7851 +ᴐ -7852 +‘ -7853 +م -7854 +! -7855 +· -7856 +í -7857 +ï -7858 +ї -7859 +â -7860 +х -7861 +ú -7862 +ù -7863 +ы -7864 +ф -7865 +ш -7866 +_ -7867 +ж -7868 +و -7869 +? -7870 +ߊ -7871 +ƙ -7872 +ю -7873 +̀ -7874 +á -7875 +ɳ -7876 +ó -7877 +ب -7878 +ɗ -7879 +& -7880 +ü -7881 +є -7882 +ì -7883 +ê -7884 +ج -7885 +ë -7886 +ş -7887 +س -7888 +ع -7889 +ن -7890 +ߞ -7891 +ñ -7892 +ه -7893 +ߏ -7894 +ߒ -7895 +߬ -7896 +ī -7897 +ъ -7898 +э -7899 +ت -7900 +د -7901 +ߋ -7902 +ߘ -7903 +߫ -7904 +߲ -7905 +ı -7906 +œ -7907 +ś -7908 +ū -7909 +ߓ -7910 +° -7911 +İ -7912 +ߌ -7913 +ὲ -7914 +ⴰ -7915 +日 -7916 +î -7917 +ö -7918 +́ -7919 +إ -7920 +ش -7921 +ߍ -7922 +ߎ -7923 +‰ -7924 +{ -7925 +ä -7926 +ø -7927 +щ -7928 +י -7929 +् -7930 +ṇ -7931 +ⵜ -7932 +本 -7933 +# -7934 +ã -7935 +û -7936 +ć -7937 +غ -7938 +ك -7939 +ߐ -7940 +ߙ -7941 +ߝ -7942 +ߡ -7943 +社 -7944 +} -7945 +ł -7946 +ũ -7947 +λ -7948 +ѣ -7949 +ئ -7950 +ز -7951 +ߖ -7952 +ߛ -7953 +ߟ -7954 +ߠ -7955 +ߣ -7956 +ߦ -7957 +ध -7958 +म -7959 +ố -7960 +′ -7961 +『 -7962 +』 -7963 +の -7964 +史 -7965 +朝 -7966 +英 -7967 +集 -7968 +$ -7969 +^ -7970 +£ -7971 +× -7972 +å -7973 +ą -7974 +č -7975 +š -7976 +ʻ -7977 +ˈ -7978 +ː -7979 +δ -7980 +σ -7981 +ה -7982 +ו -7983 +ל -7984 +מ -7985 +ר -7986 +ת -7987 +، -7988 +ح -7989 +ص -7990 +ظ -7991 +ق -7992 +ى -7993 +َ -7994 +ग -7995 diff --git a/models/vocabulary/bm_vocabulary.parquet b/models/vocabulary/bm_vocabulary.parquet new file mode 100644 index 0000000000000000000000000000000000000000..a67c61bcd5b99f3c8046cdf67be9f17e56040dbc --- /dev/null +++ b/models/vocabulary/bm_vocabulary.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d54a1977879161f36d59485af9d41f9f5140c9cf6590d94c12addac73e06114 +size 116321 diff --git a/models/vocabulary/bm_vocabulary_metadata.json b/models/vocabulary/bm_vocabulary_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..dad0ca3783771240bdd1d8547837af7c2cba72a2 --- /dev/null +++ 
b/models/vocabulary/bm_vocabulary_metadata.json @@ -0,0 +1,16 @@ +{ + "language": "bm", + "vocabulary_size": 7195, + "statistics": { + "type_token_ratio": 0.16176133457950517, + "coverage": { + "top_100": 0.46858412541661526, + "top_1000": 0.7123194667325021, + "top_5000": 0.8629710617736788, + "top_10000": 0.9264112014389758 + }, + "hapax_count": 11151, + "hapax_ratio": 0.607816417747738, + "total_documents": 1299 + } +} \ No newline at end of file diff --git a/models/word_markov/bm_markov_ctx1_word.parquet b/models/word_markov/bm_markov_ctx1_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..d0154232f9bed7dc050d62c3cc202271cc5ad351 --- /dev/null +++ b/models/word_markov/bm_markov_ctx1_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5771841e705a9dd2e47d794be576e0f304212cdfd165b9c86e4a3bbf40bc589 +size 575996 diff --git a/models/word_markov/bm_markov_ctx1_word_metadata.json b/models/word_markov/bm_markov_ctx1_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..fe11e59129bd15d507728dda9df2002035ad6202 --- /dev/null +++ b/models/word_markov/bm_markov_ctx1_word_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 1, + "variant": "word", + "language": "bm", + "unique_contexts": 18421, + "total_transitions": 140738 +} \ No newline at end of file diff --git a/models/word_markov/bm_markov_ctx2_word.parquet b/models/word_markov/bm_markov_ctx2_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..422d9695a6821fd4237c0d8f1dbcdeb9e30a1ce6 --- /dev/null +++ b/models/word_markov/bm_markov_ctx2_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75d31f3bd92ad9f4e4d1c4e921aeabc69c0202e90bc20dd9e3b9f2822ae86f7f +size 1171294 diff --git a/models/word_markov/bm_markov_ctx2_word_metadata.json b/models/word_markov/bm_markov_ctx2_word_metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..91572dcd28413282c8b459c59e494bc2a4770f34 --- /dev/null +++ b/models/word_markov/bm_markov_ctx2_word_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 2, + "variant": "word", + "language": "bm", + "unique_contexts": 65151, + "total_transitions": 139439 +} \ No newline at end of file diff --git a/models/word_markov/bm_markov_ctx3_word.parquet b/models/word_markov/bm_markov_ctx3_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..4d1d623c275489da9ab251e39784e03aa57f2d97 --- /dev/null +++ b/models/word_markov/bm_markov_ctx3_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fa392bd3a195161417c5b8dfa8792082e634a6a83b57348f2a245ae4a04efba +size 1584409 diff --git a/models/word_markov/bm_markov_ctx3_word_metadata.json b/models/word_markov/bm_markov_ctx3_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..26a25d5bd41b22bfb4cb6baedbef4d8132ee45c1 --- /dev/null +++ b/models/word_markov/bm_markov_ctx3_word_metadata.json @@ -0,0 +1,7 @@ +{ + "context_size": 3, + "variant": "word", + "language": "bm", + "unique_contexts": 96171, + "total_transitions": 138140 +} \ No newline at end of file diff --git a/models/word_markov/bm_markov_ctx4_word.parquet b/models/word_markov/bm_markov_ctx4_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..37d5d2087baa06402939fbb24dff0db98a870ec4 --- /dev/null +++ b/models/word_markov/bm_markov_ctx4_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa556a96029c6bafa0afbbae6795406371cd660317dcbb46cb396c604196f52b +size 1827580 diff --git a/models/word_markov/bm_markov_ctx4_word_metadata.json b/models/word_markov/bm_markov_ctx4_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..4b9c3a023decc2c96a6792b0e78e9ccf635a35a2 --- /dev/null +++ b/models/word_markov/bm_markov_ctx4_word_metadata.json @@ -0,0 +1,7 @@ +{ + 
"context_size": 4, + "variant": "word", + "language": "bm", + "unique_contexts": 108554, + "total_transitions": 136845 +} \ No newline at end of file diff --git a/models/word_ngram/bm_2gram_word.parquet b/models/word_ngram/bm_2gram_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..cc7db88174429923758ac2165933cb1f94b50c25 --- /dev/null +++ b/models/word_ngram/bm_2gram_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b5007949f6bbf42d027ff51fc5b8f9e4e55c91f7a05c383cb4a9d9747400c3c +size 37545 diff --git a/models/word_ngram/bm_2gram_word_metadata.json b/models/word_ngram/bm_2gram_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..764d6f75b612b566c0b58351bcd03689b9bbcbc8 --- /dev/null +++ b/models/word_ngram/bm_2gram_word_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 2, + "variant": "word", + "language": "bm", + "unique_ngrams": 2854, + "total_ngrams": 140738 +} \ No newline at end of file diff --git a/models/word_ngram/bm_3gram_word.parquet b/models/word_ngram/bm_3gram_word.parquet new file mode 100644 index 0000000000000000000000000000000000000000..9f417945bdd403606a65295aefce5a52b2ed275a --- /dev/null +++ b/models/word_ngram/bm_3gram_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f60674a1667559b06bf2d6d1c02809b85928a179d949721898f660c388b27feb +size 52891 diff --git a/models/word_ngram/bm_3gram_word_metadata.json b/models/word_ngram/bm_3gram_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..b7432bba4b75ef8b3b7c80e3a1fac3c59bcaa3d2 --- /dev/null +++ b/models/word_ngram/bm_3gram_word_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 3, + "variant": "word", + "language": "bm", + "unique_ngrams": 3554, + "total_ngrams": 139439 +} \ No newline at end of file diff --git a/models/word_ngram/bm_4gram_word.parquet b/models/word_ngram/bm_4gram_word.parquet new file mode 100644 index 
0000000000000000000000000000000000000000..e892e6ce5c9d658cd2b6b02adeb63540915a9572 --- /dev/null +++ b/models/word_ngram/bm_4gram_word.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e75ace9be8417983bb1c726ad403d1c0882df8c7f950705aedd826360a33ad7 +size 136064 diff --git a/models/word_ngram/bm_4gram_word_metadata.json b/models/word_ngram/bm_4gram_word_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..da2eaf940816f7be5e1d15f0345cca9735337a60 --- /dev/null +++ b/models/word_ngram/bm_4gram_word_metadata.json @@ -0,0 +1,7 @@ +{ + "n": 4, + "variant": "word", + "language": "bm", + "unique_ngrams": 8337, + "total_ngrams": 138140 +} \ No newline at end of file diff --git a/visualizations/embedding_isotropy.png b/visualizations/embedding_isotropy.png new file mode 100644 index 0000000000000000000000000000000000000000..660ea8b1d309d8952bb4b27a83c16e57aca48781 Binary files /dev/null and b/visualizations/embedding_isotropy.png differ diff --git a/visualizations/embedding_norms.png b/visualizations/embedding_norms.png new file mode 100644 index 0000000000000000000000000000000000000000..39e6575104958a788a5620245a3363be54ba0154 Binary files /dev/null and b/visualizations/embedding_norms.png differ diff --git a/visualizations/embedding_similarity.png b/visualizations/embedding_similarity.png new file mode 100644 index 0000000000000000000000000000000000000000..c570c0d078aaca0419e25e13c2293688dd804025 --- /dev/null +++ b/visualizations/embedding_similarity.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:865d3f432225d6e9fa27c3b399fbbf0f61c7c1ea14a4f190ea27238bc566bf7b +size 152019 diff --git a/visualizations/markov_branching.png b/visualizations/markov_branching.png new file mode 100644 index 0000000000000000000000000000000000000000..c60b40a378f54c6af001b617b41d63afeb1e1145 Binary files /dev/null and b/visualizations/markov_branching.png differ diff --git a/visualizations/markov_contexts.png 
b/visualizations/markov_contexts.png new file mode 100644 index 0000000000000000000000000000000000000000..c5a7b902a7ff482e787ae69012e18741639664bb Binary files /dev/null and b/visualizations/markov_contexts.png differ diff --git a/visualizations/markov_entropy.png b/visualizations/markov_entropy.png new file mode 100644 index 0000000000000000000000000000000000000000..42d6ce7ff14a8e1659993c6622d0bb26daba2d4e Binary files /dev/null and b/visualizations/markov_entropy.png differ diff --git a/visualizations/model_sizes.png b/visualizations/model_sizes.png new file mode 100644 index 0000000000000000000000000000000000000000..ee6a389c7c9c8a92c51a3321f6198a28daa7933f Binary files /dev/null and b/visualizations/model_sizes.png differ diff --git a/visualizations/nearest_neighbors.png b/visualizations/nearest_neighbors.png new file mode 100644 index 0000000000000000000000000000000000000000..24c85f83b2dbe8c0406253647b3926672860221e Binary files /dev/null and b/visualizations/nearest_neighbors.png differ diff --git a/visualizations/ngram_coverage.png b/visualizations/ngram_coverage.png new file mode 100644 index 0000000000000000000000000000000000000000..52d35f9ecfdb929218db11cc3fa0c46a5f01ba57 Binary files /dev/null and b/visualizations/ngram_coverage.png differ diff --git a/visualizations/ngram_entropy.png b/visualizations/ngram_entropy.png new file mode 100644 index 0000000000000000000000000000000000000000..8ccd9ff245eb1e39d3725cb0d133c935f14f257c Binary files /dev/null and b/visualizations/ngram_entropy.png differ diff --git a/visualizations/ngram_perplexity.png b/visualizations/ngram_perplexity.png new file mode 100644 index 0000000000000000000000000000000000000000..4b9f0699716890a46513ec1b6efb7ec72157ca25 Binary files /dev/null and b/visualizations/ngram_perplexity.png differ diff --git a/visualizations/ngram_unique.png b/visualizations/ngram_unique.png new file mode 100644 index 0000000000000000000000000000000000000000..bad0abaf8b933a91307e92780c66059c54ba99c5 Binary 
files /dev/null and b/visualizations/ngram_unique.png differ diff --git a/visualizations/performance_dashboard.png b/visualizations/performance_dashboard.png new file mode 100644 index 0000000000000000000000000000000000000000..b0225f0215538b8e2abc7afce21aab067ebc17e7 --- /dev/null +++ b/visualizations/performance_dashboard.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:497f71cd84db6090e634f92c122fb3d970763a7439bf7a29a766d2dfaad814ed +size 264741 diff --git a/visualizations/position_encoding_comparison.png b/visualizations/position_encoding_comparison.png new file mode 100644 index 0000000000000000000000000000000000000000..a70e69ed91d8f0a07d3ffbf12d1bdce3956a8963 --- /dev/null +++ b/visualizations/position_encoding_comparison.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8da2bfb78a8a446ee726698884fc1e00a3e218dd11ffc0cc8ae45cc7dff852bc +size 112594 diff --git a/visualizations/tokenizer_compression.png b/visualizations/tokenizer_compression.png new file mode 100644 index 0000000000000000000000000000000000000000..7fa97890d52b716e5dae56fdcf106b6b4892dc66 Binary files /dev/null and b/visualizations/tokenizer_compression.png differ diff --git a/visualizations/tokenizer_fertility.png b/visualizations/tokenizer_fertility.png new file mode 100644 index 0000000000000000000000000000000000000000..c9181f132e1bcae96dd0e9b0fa6bb28e8534efcd Binary files /dev/null and b/visualizations/tokenizer_fertility.png differ diff --git a/visualizations/tokenizer_oov.png b/visualizations/tokenizer_oov.png new file mode 100644 index 0000000000000000000000000000000000000000..f61617dd924b9182933cb438ed3ac347d19ed146 Binary files /dev/null and b/visualizations/tokenizer_oov.png differ diff --git a/visualizations/tokenizer_total_tokens.png b/visualizations/tokenizer_total_tokens.png new file mode 100644 index 0000000000000000000000000000000000000000..0300b46b5ac7cda51e15a41772a74df0ca85557c Binary files /dev/null and 
b/visualizations/tokenizer_total_tokens.png differ diff --git a/visualizations/top20_words.png b/visualizations/top20_words.png new file mode 100644 index 0000000000000000000000000000000000000000..5cc0b668d0521d39aa8796046cc23a1cd5c09525 Binary files /dev/null and b/visualizations/top20_words.png differ diff --git a/visualizations/tsne_sentences.png b/visualizations/tsne_sentences.png new file mode 100644 index 0000000000000000000000000000000000000000..ada1b4f2eb640e6d5f8cae47d7c3c45d14bb2a05 --- /dev/null +++ b/visualizations/tsne_sentences.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2a788e0b63e0030e80f58ac14eaa5bff4c0dcbde24971f7a6dcb11ea004fb83 +size 230699 diff --git a/visualizations/tsne_words.png b/visualizations/tsne_words.png new file mode 100644 index 0000000000000000000000000000000000000000..dfd76a3841b998377b6c1e5066aa3b6a336418da --- /dev/null +++ b/visualizations/tsne_words.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ec16b56ae65a586d368d56e5888463ef1f21e71c7258c472096b2360895e851 +size 697319 diff --git a/visualizations/vocab_coverage.png b/visualizations/vocab_coverage.png new file mode 100644 index 0000000000000000000000000000000000000000..a8449807790a09ede5bf0a19e5c86aa858d846c6 Binary files /dev/null and b/visualizations/vocab_coverage.png differ diff --git a/visualizations/vocab_freq_dist.png b/visualizations/vocab_freq_dist.png new file mode 100644 index 0000000000000000000000000000000000000000..c56e219e3f730f2783e3743cf3e274c1010726e3 Binary files /dev/null and b/visualizations/vocab_freq_dist.png differ diff --git a/visualizations/zipf_law.png b/visualizations/zipf_law.png new file mode 100644 index 0000000000000000000000000000000000000000..5f2f726e943e9d7050a6644032deab13474809cf --- /dev/null +++ b/visualizations/zipf_law.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ac160686d0e021cfdecc44e0c0dddf23702119ddf99079bccd0b4e8557d4e92 +size 108432