{ "added_tokens_decoder": { "2": { "content": "tʰ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "3": { "content": "tɕ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "4": { "content": "tɕ*", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "5": { "content": "tɕʰ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "8": { "content": "k*", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "9": { "content": "kʰ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "14": { "content": "t*", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "15": { "content": "p*", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "16": { "content": "pʰ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "18": { "content": "s*", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "23": { "content": "wɛ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "27": { "content": "ɰi", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "28": { "content": "jo", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "29": { "content": "ju", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "30": { "content": "ja", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "31": { "content": "jʌ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "32": { "content": "jɛ", "lstrip": true, "normalized": 
false, "rstrip": true, "single_word": false, "special": false }, "33": { "content": "wa", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "34": { "content": "wʌ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "35": { "content": "wi", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "37": { "content": "[UNK]", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "38": { "content": "[PAD]", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "39": { "content": "<s>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "40": { "content": "</s>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true } }, "bos_token": "<s>", "clean_up_tokenization_spaces": true, "do_lower_case": false, "do_normalize": true, "eos_token": "</s>", "model_max_length": 1000000000000000019884624838656, "pad_token": "[PAD]", "replace_word_delimiter_char": " ", "return_attention_mask": false, "target_lang": null, "tokenizer_class": "Wav2Vec2CTCTokenizer", "unk_token": "[UNK]", "word_delimiter_token": "|" }