{ "added_tokens_decoder": { "0": { "content": "<s>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "1": { "content": "<pad>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "2": { "content": "</s>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "3": { "content": "<unk>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "32001": { "content": "<mask>", "lstrip": true, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "32002": { "content": "ᡀ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32003": { "content": "ᡂ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32004": { "content": "ᡑ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32005": { "content": "ᡘ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32006": { "content": "ᠿ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32007": { "content": "ᡛ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32008": { "content": "ᢋ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32009": { "content": "ᢒ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32010": { "content": "ᠼ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32011": { "content": "ᠻ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32012": { "content": "᠀", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32013": { "content": 
"ᠾ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32014": { "content": "᠅", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32015": { "content": "=", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32016": { "content": "᠓", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32017": { "content": "᠑", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32018": { "content": "᠒", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32019": { "content": "᠔", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32020": { "content": "᠐", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32021": { "content": "᠕", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32022": { "content": "᠗", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32023": { "content": "A", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32024": { "content": "a", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32025": { "content": "B", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32026": { "content": "b", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32027": { "content": "C", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32028": { "content": "c", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32029": { "content": "D", "lstrip": false, 
"normalized": true, "rstrip": false, "single_word": false, "special": false }, "32030": { "content": "d", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32031": { "content": "E", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32032": { "content": "e", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32033": { "content": "F", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32034": { "content": "f", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32035": { "content": "G", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32036": { "content": "g", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32037": { "content": "H", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32038": { "content": "h", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32039": { "content": "I", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32040": { "content": "i", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32041": { "content": "J", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32042": { "content": "j", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32043": { "content": "K", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32044": { "content": "k", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32045": { "content": "L", "lstrip": false, "normalized": true, "rstrip": 
false, "single_word": false, "special": false }, "32046": { "content": "l", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32047": { "content": "M", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32048": { "content": "m", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32049": { "content": "N", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32050": { "content": "n", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32051": { "content": "O", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32052": { "content": "o", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32053": { "content": "P", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32054": { "content": "p", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32055": { "content": "Q", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32056": { "content": "q", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32057": { "content": "R", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32058": { "content": "r", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32059": { "content": "S", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32060": { "content": "s", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32061": { "content": "T", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, 
"special": false }, "32062": { "content": "t", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32063": { "content": "U", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32064": { "content": "u", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32065": { "content": "V", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32066": { "content": "v", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32067": { "content": "W", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32068": { "content": "w", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32069": { "content": "X", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32070": { "content": "x", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32071": { "content": "Y", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32072": { "content": "y", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32073": { "content": "Z", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32074": { "content": "z", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32075": { "content": "᠙", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32076": { "content": "᠘", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32077": { "content": "᠖", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32078": { 
"content": "<", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32079": { "content": ">", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32080": { "content": "№", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32081": { "content": "+", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32082": { "content": "ᢀ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32083": { "content": "〈", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32084": { "content": "〉", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32085": { "content": "︱", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32086": { "content": "“", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32087": { "content": "”", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32088": { "content": "Ё", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32089": { "content": "Ю", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32090": { "content": "ᡁ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32091": { "content": "÷", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32092": { "content": "*", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32093": { "content": "&", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32094": { "content": "@", "lstrip": 
false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32095": { "content": "}", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32096": { "content": "{", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32097": { "content": "[", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32098": { "content": "]", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32099": { "content": "ᢔ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32100": { "content": "ᡶ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32101": { "content": "ᡵ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32102": { "content": "ᡙ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32103": { "content": "ᢖ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32104": { "content": "Щ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32105": { "content": "ᡧ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32106": { "content": "ᢍ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32107": { "content": "ᢏ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32108": { "content": "ᢇ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32109": { "content": "ᡩ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32110": { "content": "ᡥ", "lstrip": false, "normalized": true, 
"rstrip": false, "single_word": false, "special": false }, "32111": { "content": "Ь", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32112": { "content": "Ъ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32113": { "content": "ᡝ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32114": { "content": "ᡳ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32115": { "content": "щ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32116": { "content": "ᢐ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32117": { "content": "ᡨ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32118": { "content": "ᢎ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32119": { "content": "ᢌ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32120": { "content": "ᡡ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32121": { "content": "ᢊ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32122": { "content": "ᡠ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32123": { "content": "ᡯ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false }, "32124": { "content": "ᡤ", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": false } }, "bos_token": "", "clean_up_tokenization_spaces": true, "cls_token": "", "eos_token": "", "is_fast": false, "mask_token": "", "model_max_length": 1000000000000000019884624838656, "pad_token": "", "sep_token": "", 
"sp_model_kwargs": {}, "tokenizer_class": "XLMRobertaTokenizer", "unk_token": "" }