{ "added_tokens_decoder": { "7": { "content": "d͡ʒ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "8": { "content": "oʊ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "12": { "content": "ʊə", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "16": { "content": "aʊ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "17": { "content": "t͡ʃ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "20": { "content": "aɪ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "21": { "content": "eə", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "23": { "content": "ɪə", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "26": { "content": "əʊ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "27": { "content": "eɪ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "37": { "content": "ɔɪ", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "46": { "content": "[UNK]", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "47": { "content": "[PAD]", "lstrip": true, "normalized": false, "rstrip": true, "single_word": false, "special": false }, "49": { "content": "<s>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "50": { "content": "</s>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true } }, "bos_token": "<s>", "clean_up_tokenization_spaces": false, "do_lower_case": false, "eos_token": "</s>", "extra_special_tokens": {}, "model_max_length": 
1000000000000000019884624838656, "pad_token": "[PAD]", "processor_class": "Wav2Vec2Processor", "replace_word_delimiter_char": " ", "target_lang": null, "tokenizer_class": "Wav2Vec2CTCTokenizer", "unk_token": "[UNK]", "word_delimiter_token": " " }