{ "added_tokens_decoder": { "0": { "content": "[UNK]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "1": { "content": "[PAD]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "2": { "content": "[CLS]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "3": { "content": "[SEP]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "4": { "content": "[MASK]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "5": { "content": "[p]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "6": { "content": "[b]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "7": { "content": "[t]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "8": { "content": "[d]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "9": { "content": "[k]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "10": { "content": "[g]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "11": { "content": "[ɓ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "12": { "content": "[ɗ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "13": { "content": "[ƴ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "14": { "content": "[mb]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "15": { "content": "[ɲ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "16": { "content": "[nd]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "17": { "content": "[ŋg]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "18": { "content": "[ŋk]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "19": { "content": "[gb]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "20": { "content": "[kp]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "21": { "content": "[c]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "22": { "content": "[j]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "23": { "content": "[f]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "24": { "content": "[v]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "25": { "content": "[s]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "26": { "content": "[z]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "27": { "content": "[x]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "28": { "content": "[h]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "29": { "content": "[m]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "30": { "content": "[n]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "31": { "content": "[ŋ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "32": { "content": "[l]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "33": { "content": "[r]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "34": { "content": "[w]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "35": { "content": "[y]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "36": { "content": "[ny]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "37": { "content": "[i]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "38": { "content": "[u]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "39": { "content": "[e]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "40": { "content": "[o]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "41": { "content": "[a]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "42": { "content": "[ə]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "43": { "content": "[ɛ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "44": { "content": "[ɔ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "45": { "content": "[ii]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "46": { "content": "[uu]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "47": { "content": "[ee]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "48": { "content": "[oo]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "49": { "content": "[aa]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "50": { "content": "[əə]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "51": { "content": "[ɛɛ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "52": { "content": "[ɔɔ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "53": { "content": "[ĩ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "54": { "content": "[ũ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "55": { "content": "[ẽ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "56": { "content": "[õ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "57": { "content": "[ã]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "58": { "content": "[ə̃]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "59": { "content": "[ɛ̃]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "60": { "content": "[ɔ̃]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "61": { "content": "[ia]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "62": { "content": "[ua]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "63": { "content": "[ei]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "64": { "content": "[ou]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "65": { "content": "[á]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "66": { "content": "[à]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "67": { "content": "[é]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "68": { "content": "[è]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "69": { "content": "[í]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "70": { "content": "[ì]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "71": { "content": "[ó]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "72": { "content": "[ò]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "73": { "content": "[ú]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "74": { "content": "[ù]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "75": { "content": "[ə́]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "76": { "content": "[ə̀]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "77": { "content": "[ɛ́]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "78": { "content": "[ɛ̀]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "79": { "content": "[ɔ́]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "80": { "content": "[ɔ̀]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "81": { "content": "[áà]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "82": { "content": "[àá]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "83": { "content": "[áa]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "84": { "content": "[aá]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "85": { "content": "[áá]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "86": { "content": "[àà]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "87": { "content": "[ə́ə́]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "88": { "content": "[ə̀ə̀]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "89": { "content": "[ɛ́ɛ́]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "90": { "content": "[ɛ̀ɛ̀]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "91": { "content": "[ɔ́ɔ́]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "92": { "content": "[ɔ̀ɔ̀]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "93": { "content": "[óó]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "94": { "content": "[òò]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "95": { "content": "[íí]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "96": { "content": "[ìì]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "97": { "content": "[úú]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "98": { "content": "[ùù]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "99": { "content": "[ǎ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "100": { "content": "[ě]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "101": { "content": "[ǐ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "102": { "content": "[ǒ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "103": { "content": "[ǔ]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "104": { "content": "[ə̌]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "105": { "content": "[ɛ̌]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "106": { "content": "[ɔ̌]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "107": { "content": "[...]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "108": { "content": "[-]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "109": { "content": "[—]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "110": { "content": "[–]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "111": { "content": "[_]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "112": { "content": "[°]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "113": { "content": "[«]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "114": { "content": "[»]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "115": { "content": "[(]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "116": { "content": "[)]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "117": { "content": "[[]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "118": { "content": "[]]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "119": { "content": "[{]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "120": { "content": "[}]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "121": { "content": "[<]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "122": { "content": "[>]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "123": { "content": "[&]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "124": { "content": "[*]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "125": { "content": "[#]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "126": { "content": "[$]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "127": { "content": "[£]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "128": { "content": "[%]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "129": { "content": "[+]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "130": { "content": "[=]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "131": { "content": "[|]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "132": { "content": "[/]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "133": { "content": "[\\]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "134": { "content": "[@]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "135": { "content": "[www]", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true } }, "clean_up_tokenization_spaces": false, "cls_token": "[CLS]", "do_lower_case": true, "extra_special_tokens": {}, "mask_token": "[MASK]", "model_max_length": 1000000000000000019884624838656, "pad_token": "[PAD]", "sep_token": "[SEP]", "strip_accents": null, "tokenize_chinese_chars": true, "tokenizer_class": "BertTokenizer", "unk_token": "[UNK]" }