| { | |
| "added_tokens_decoder": { | |
| "1": { | |
| "content": "td", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "3": { | |
| "content": "ìy", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "7": { | |
| "content": "nz", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "13": { | |
| "content": "dr", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "14": { | |
| "content": "z̀", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "15": { | |
| "content": "dj", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "16": { | |
| "content": "ǒw", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "20": { | |
| "content": "ey", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "21": { | |
| "content": "òw", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "22": { | |
| "content": "nd", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "23": { | |
| "content": "mb", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "24": { | |
| "content": "ǔw", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "25": { | |
| "content": "dh", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "29": { | |
| "content": "dz", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "32": { | |
| "content": "ch", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "34": { | |
| "content": "uw", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "39": { | |
| "content": "ǐy", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "41": { | |
| "content": "ž", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "42": { | |
| "content": "tdr", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "45": { | |
| "content": "th", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "46": { | |
| "content": "úw", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "52": { | |
| "content": "ź", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "56": { | |
| "content": "ow", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "57": { | |
| "content": "nj", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "58": { | |
| "content": "ùw", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "60": { | |
| "content": "dd", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "61": { | |
| "content": "íy", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "67": { | |
| "content": "kp", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "72": { | |
| "content": "gb", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "76": { | |
| "content": "r̀", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "77": { | |
| "content": "dy", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "81": { | |
| "content": "sh", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "82": { | |
| "content": "ěy", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "84": { | |
| "content": "ngb", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "89": { | |
| "content": "ŕ", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "90": { | |
| "content": "ng", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "91": { | |
| "content": "ndr", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "92": { | |
| "content": "ów", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "98": { | |
| "content": "ny", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "103": { | |
| "content": "pb", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "105": { | |
| "content": "tdy", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "111": { | |
| "content": "iy", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "112": { | |
| "content": "èy", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "114": { | |
| "content": "éy", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "115": { | |
| "content": "bb", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "117": { | |
| "content": "ř", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "125": { | |
| "content": "ts", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "128": { | |
| "content": "...", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "129": { | |
| "content": "[UNK]", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "130": { | |
| "content": "[PAD]", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "131": { | |
| "content": "<s>", | |
| "lstrip": false, | |
| "normalized": false, | |
| "rstrip": false, | |
| "single_word": false, | |
| "special": true | |
| }, | |
| "132": { | |
| "content": "</s>", | |
| "lstrip": false, | |
| "normalized": false, | |
| "rstrip": false, | |
| "single_word": false, | |
| "special": true | |
| } | |
| }, | |
| "bos_token": "<s>", | |
| "clean_up_tokenization_spaces": false, | |
| "do_lower_case": false, | |
| "eos_token": "</s>", | |
| "extra_special_tokens": {}, | |
| "model_max_length": 1000000000000000019884624838656, | |
| "pad_token": "[PAD]", | |
| "replace_word_delimiter_char": " ", | |
| "target_lang": "led", | |
| "tokenizer_class": "Wav2Vec2CTCTokenizer", | |
| "unk_token": "[UNK]", | |
| "word_delimiter_token": "|" | |
| } | |