mms-tts-kca / vocab.json
sanchit-gandhi's picture
Upload tokenizer
5b9d4bc
raw
history blame contribute delete
542 Bytes
{
" ": 24,
"'": 2,
"-": 25,
"_": 27,
"ă": 15,
"ŏ": 21,
"а": 43,
"б": 45,
"в": 13,
"г": 26,
"д": 34,
"е": 14,
"з": 6,
"и": 32,
"й": 33,
"к": 4,
"л": 41,
"м": 5,
"н": 35,
"о": 31,
"п": 11,
"р": 22,
"с": 10,
"т": 18,
"у": 28,
"ф": 37,
"х": 20,
"ц": 0,
"ч": 3,
"ш": 12,
"щ": 44,
"ы": 19,
"ь": 38,
"э": 36,
"ю": 40,
"я": 42,
"ё": 39,
"ў": 16,
"ӈ": 23,
"ӑ": 7,
"ә": 8,
"ԉ": 29,
"ԋ": 17,
"ԏ": 30,
"ԓ": 9,
"–": 1
}