| { | |
| "added_tokens_decoder": { | |
| "0": { | |
| "content": "<s>", | |
| "lstrip": false, | |
| "normalized": false, | |
| "rstrip": false, | |
| "single_word": false, | |
| "special": true | |
| }, | |
| "1": { | |
| "content": "<pad>", | |
| "lstrip": false, | |
| "normalized": false, | |
| "rstrip": false, | |
| "single_word": false, | |
| "special": true | |
| }, | |
| "2": { | |
| "content": "</s>", | |
| "lstrip": false, | |
| "normalized": false, | |
| "rstrip": false, | |
| "single_word": false, | |
| "special": true | |
| }, | |
| "3": { | |
| "content": "<unk>", | |
| "lstrip": false, | |
| "normalized": false, | |
| "rstrip": false, | |
| "single_word": false, | |
| "special": true | |
| }, | |
| "79": { | |
| "content": "<mask>", | |
| "lstrip": false, | |
| "normalized": false, | |
| "rstrip": false, | |
| "single_word": false, | |
| "special": true | |
| }, | |
| "80": { | |
| "content": "<ctc_blank>", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "81": { | |
| "content": "ஃ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "82": { | |
| "content": "அ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "83": { | |
| "content": "ஆ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "84": { | |
| "content": "இ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "85": { | |
| "content": "ஈ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "86": { | |
| "content": "உ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "87": { | |
| "content": "ஊ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "88": { | |
| "content": "எ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "89": { | |
| "content": "ஏ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "90": { | |
| "content": "ஐ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "91": { | |
| "content": "ஒ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "92": { | |
| "content": "ஓ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "93": { | |
| "content": "ஔ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "94": { | |
| "content": "க", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "95": { | |
| "content": "ங", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "96": { | |
| "content": "ச", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "97": { | |
| "content": "ஜ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "98": { | |
| "content": "ஞ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "99": { | |
| "content": "ட", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "100": { | |
| "content": "ண", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "101": { | |
| "content": "த", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "102": { | |
| "content": "ந", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "103": { | |
| "content": "ன", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "104": { | |
| "content": "ப", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "105": { | |
| "content": "ம", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "106": { | |
| "content": "ய", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "107": { | |
| "content": "ர", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "108": { | |
| "content": "ற", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "109": { | |
| "content": "ல", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "110": { | |
| "content": "ள", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "111": { | |
| "content": "ழ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "112": { | |
| "content": "வ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "113": { | |
| "content": "ஶ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "114": { | |
| "content": "ஷ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "115": { | |
| "content": "ஸ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "116": { | |
| "content": "ஹ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "117": { | |
| "content": "ா", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "118": { | |
| "content": "ி", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "119": { | |
| "content": "ீ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "120": { | |
| "content": "ு", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "121": { | |
| "content": "ூ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "122": { | |
| "content": "ெ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "123": { | |
| "content": "ே", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "124": { | |
| "content": "ை", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "125": { | |
| "content": "ொ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "126": { | |
| "content": "ோ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "127": { | |
| "content": "ௌ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "128": { | |
| "content": "்", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| }, | |
| "129": { | |
| "content": "ௗ", | |
| "lstrip": true, | |
| "normalized": true, | |
| "rstrip": true, | |
| "single_word": false, | |
| "special": false | |
| } | |
| }, | |
| "additional_special_tokens": [ | |
| "<s>", | |
| "<pad>", | |
| "</s>", | |
| "<unk>", | |
| "<mask>" | |
| ], | |
| "bos_token": "<s>", | |
| "clean_up_tokenization_spaces": true, | |
| "eos_token": "</s>", | |
| "mask_token": "<mask>", | |
| "model_max_length": 600, | |
| "normalize": false, | |
| "pad_token": "<pad>", | |
| "processor_class": "SpeechT5Processor", | |
| "sp_model_kwargs": {}, | |
| "tokenizer_class": "SpeechT5Tokenizer", | |
| "tokenizer_file": null, | |
| "unk_token": "<unk>" | |
| } | |