| { | |
| "version": "1.0", | |
| "truncation": null, | |
| "padding": null, | |
| "added_tokens": [ | |
| { | |
| "id": 0, | |
| "content": "[UNK]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 1, | |
| "content": "[CLS]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 2, | |
| "content": "[SEP]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 3, | |
| "content": "[PAD]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 4, | |
| "content": "[MASK]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| } | |
| ], | |
| "normalizer": null, | |
| "pre_tokenizer": { | |
| "type": "Whitespace" | |
| }, | |
| "post_processor": null, | |
| "decoder": null, | |
| "model": { | |
| "type": "BPE", | |
| "dropout": null, | |
| "unk_token": "[UNK]", | |
| "continuing_subword_prefix": null, | |
| "end_of_word_suffix": null, | |
| "fuse_unk": false, | |
| "byte_fallback": false, | |
| "ignore_merges": false, | |
| "vocab": { | |
| "[UNK]": 0, | |
| "[CLS]": 1, | |
| "[SEP]": 2, | |
| "[PAD]": 3, | |
| "[MASK]": 4, | |
| "!": 5, | |
| ".": 6, | |
| "G": 7, | |
| "M": 8, | |
| "Q": 9, | |
| "T": 10, | |
| "W": 11, | |
| "a": 12, | |
| "b": 13, | |
| "d": 14, | |
| "e": 15, | |
| "f": 16, | |
| "i": 17, | |
| "j": 18, | |
| "l": 19, | |
| "m": 20, | |
| "n": 21, | |
| "o": 22, | |
| "p": 23, | |
| "q": 24, | |
| "r": 25, | |
| "s": 26, | |
| "t": 27, | |
| "u": 28, | |
| "v": 29, | |
| "w": 30, | |
| "ç": 31, | |
| "é": 32, | |
| "..": 33, | |
| "ou": 34, | |
| "aou": 35, | |
| "aouf": 36, | |
| "Waouf": 37, | |
| "rr": 38, | |
| "is": 39, | |
| "Grr": 40, | |
| "le": 41, | |
| "on": 42, | |
| "su": 43, | |
| "...": 44, | |
| "Grrr": 45, | |
| "suis": 46, | |
| "as": 47, | |
| "ble": 48, | |
| "dis": 49, | |
| "ible": 50, | |
| "je": 51, | |
| "oi": 52, | |
| "pon": 53, | |
| "pas": 54, | |
| "rd": 55, | |
| "sou": 56, | |
| "te": 57, | |
| "uoi": 58, | |
| "....": 59, | |
| "dispon": 60, | |
| "sourd": 61, | |
| "disponible": 62, | |
| "!!": 63, | |
| "!.": 64, | |
| "Ma": 65, | |
| "Quoi": 66, | |
| "Ta": 67, | |
| "Tu": 68, | |
| "aa": 69, | |
| "ai": 70, | |
| "dé": 71, | |
| "eu": 72, | |
| "fai": 73, | |
| "ir": 74, | |
| "iu": 75, | |
| "me": 76, | |
| "non": 77, | |
| "or": 78, | |
| "quoi": 79, | |
| "riu": 80, | |
| "ste": 81, | |
| "sor": 82, | |
| "tir": 83, | |
| "veu": 84, | |
| "waouf": 85, | |
| "waa": 86, | |
| "ça": 87, | |
| "les": 88, | |
| "teste": 89, | |
| "Mariu": 90, | |
| "déteste": 91, | |
| "fait": 92, | |
| "sortir": 93, | |
| "veut": 94, | |
| "Marius": 95 | |
| }, | |
| "merges": [ | |
| [ | |
| ".", | |
| "." | |
| ], | |
| [ | |
| "o", | |
| "u" | |
| ], | |
| [ | |
| "a", | |
| "ou" | |
| ], | |
| [ | |
| "aou", | |
| "f" | |
| ], | |
| [ | |
| "W", | |
| "aouf" | |
| ], | |
| [ | |
| "r", | |
| "r" | |
| ], | |
| [ | |
| "i", | |
| "s" | |
| ], | |
| [ | |
| "G", | |
| "rr" | |
| ], | |
| [ | |
| "l", | |
| "e" | |
| ], | |
| [ | |
| "o", | |
| "n" | |
| ], | |
| [ | |
| "s", | |
| "u" | |
| ], | |
| [ | |
| "..", | |
| "." | |
| ], | |
| [ | |
| "Grr", | |
| "r" | |
| ], | |
| [ | |
| "su", | |
| "is" | |
| ], | |
| [ | |
| "a", | |
| "s" | |
| ], | |
| [ | |
| "b", | |
| "le" | |
| ], | |
| [ | |
| "d", | |
| "is" | |
| ], | |
| [ | |
| "i", | |
| "ble" | |
| ], | |
| [ | |
| "j", | |
| "e" | |
| ], | |
| [ | |
| "o", | |
| "i" | |
| ], | |
| [ | |
| "p", | |
| "on" | |
| ], | |
| [ | |
| "p", | |
| "as" | |
| ], | |
| [ | |
| "r", | |
| "d" | |
| ], | |
| [ | |
| "s", | |
| "ou" | |
| ], | |
| [ | |
| "t", | |
| "e" | |
| ], | |
| [ | |
| "u", | |
| "oi" | |
| ], | |
| [ | |
| "..", | |
| ".." | |
| ], | |
| [ | |
| "dis", | |
| "pon" | |
| ], | |
| [ | |
| "sou", | |
| "rd" | |
| ], | |
| [ | |
| "dispon", | |
| "ible" | |
| ], | |
| [ | |
| "!", | |
| "!" | |
| ], | |
| [ | |
| "!", | |
| "." | |
| ], | |
| [ | |
| "M", | |
| "a" | |
| ], | |
| [ | |
| "Q", | |
| "uoi" | |
| ], | |
| [ | |
| "T", | |
| "a" | |
| ], | |
| [ | |
| "T", | |
| "u" | |
| ], | |
| [ | |
| "a", | |
| "a" | |
| ], | |
| [ | |
| "a", | |
| "i" | |
| ], | |
| [ | |
| "d", | |
| "é" | |
| ], | |
| [ | |
| "e", | |
| "u" | |
| ], | |
| [ | |
| "f", | |
| "ai" | |
| ], | |
| [ | |
| "i", | |
| "r" | |
| ], | |
| [ | |
| "i", | |
| "u" | |
| ], | |
| [ | |
| "m", | |
| "e" | |
| ], | |
| [ | |
| "n", | |
| "on" | |
| ], | |
| [ | |
| "o", | |
| "r" | |
| ], | |
| [ | |
| "q", | |
| "uoi" | |
| ], | |
| [ | |
| "r", | |
| "iu" | |
| ], | |
| [ | |
| "s", | |
| "te" | |
| ], | |
| [ | |
| "s", | |
| "or" | |
| ], | |
| [ | |
| "t", | |
| "ir" | |
| ], | |
| [ | |
| "v", | |
| "eu" | |
| ], | |
| [ | |
| "w", | |
| "aouf" | |
| ], | |
| [ | |
| "w", | |
| "aa" | |
| ], | |
| [ | |
| "ç", | |
| "a" | |
| ], | |
| [ | |
| "le", | |
| "s" | |
| ], | |
| [ | |
| "te", | |
| "ste" | |
| ], | |
| [ | |
| "Ma", | |
| "riu" | |
| ], | |
| [ | |
| "dé", | |
| "teste" | |
| ], | |
| [ | |
| "fai", | |
| "t" | |
| ], | |
| [ | |
| "sor", | |
| "tir" | |
| ], | |
| [ | |
| "veu", | |
| "t" | |
| ], | |
| [ | |
| "Mariu", | |
| "s" | |
| ] | |
| ] | |
| } | |
| } |