native config MMS.json: +60
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- facebook__mms-tts-ata-Pele-Ata/config.json +68 -0
- facebook__mms-tts-fas-Persian/config.json +79 -0
- facebook__mms-tts-kek-Q’eqchi’/config.json +72 -0
- facebook__mms-tts-kjb-Q’anjob’al/config.json +83 -0
- facebook__mms-tts-lje-Rampi/config.json +70 -0
- facebook__mms-tts-lme-Pévé/config.json +72 -0
- facebook__mms-tts-pab-Parecís/config.json +85 -0
- facebook__mms-tts-pad-Paumarí/config.json +86 -0
- facebook__mms-tts-pag-Pangasinan/config.json +67 -0
- facebook__mms-tts-pan-Punjabi_Eastern/config.json +94 -0
- facebook__mms-tts-pap-Papiamentu/config.json +86 -0
- facebook__mms-tts-pbc-Patamona/config.json +77 -0
- facebook__mms-tts-pbi-Parkwa/config.json +71 -0
- facebook__mms-tts-pcm-Pidgin_Nigerian/config.json +71 -0
- facebook__mms-tts-peg-Pengo/config.json +73 -0
- facebook__mms-tts-pez-Penan_Eastern/config.json +68 -0
- facebook__mms-tts-pir-Piratapuyo/config.json +79 -0
- facebook__mms-tts-pis-Pijin/config.json +71 -0
- facebook__mms-tts-pjt-Pitjantjatjara/config.json +80 -0
- facebook__mms-tts-pls-Popoloca_San_Marcos_Tlacoyalco/config.json +80 -0
- facebook__mms-tts-pmf-Pamona/config.json +62 -0
- facebook__mms-tts-pny-Pinyin/config.json +90 -0
- facebook__mms-tts-poh-dialect_eastern-Poqomchi’/config.json +72 -0
- facebook__mms-tts-poh-dialect_western-Poqomchi’/config.json +64 -0
- facebook__mms-tts-poi-Popoluca_Highland/config.json +74 -0
- facebook__mms-tts-pol-Polish/config.json +81 -0
- facebook__mms-tts-por-Portuguese/config.json +78 -0
- facebook__mms-tts-poy-Pogolo/config.json +62 -0
- facebook__mms-tts-pps-Popoloca_San_Luís_Temalacayuca/config.json +81 -0
- facebook__mms-tts-prf-Paranan/config.json +71 -0
- facebook__mms-tts-prt-Prai/config.json +90 -0
- facebook__mms-tts-pui-Puinave/config.json +77 -0
- facebook__mms-tts-qub-Quechua_Huallaga/config.json +76 -0
- facebook__mms-tts-quf-Quechua_Lambayeque/config.json +70 -0
- facebook__mms-tts-quh-Quechua_South_Bolivian/config.json +78 -0
- facebook__mms-tts-qul-Quechua_North_Bolivian/config.json +73 -0
- facebook__mms-tts-quw-Quichua_Tena_Lowland/config.json +79 -0
- facebook__mms-tts-quy-Quechua_Ayacucho/config.json +71 -0
- facebook__mms-tts-quz-Quechua_Cusco/config.json +72 -0
- facebook__mms-tts-qvc-Quechua_Cajamarca/config.json +77 -0
- facebook__mms-tts-qve-Quechua_Eastern_Apurímac/config.json +75 -0
- facebook__mms-tts-qvh-Quechua_Huamalíes-Dos_de_Mayo_Huánuco/config.json +76 -0
- facebook__mms-tts-qvm-Quechua_Margos-Yarowilca-Lauricocha/config.json +76 -0
- facebook__mms-tts-qvn-Quechua_North_Junín/config.json +77 -0
- facebook__mms-tts-qvo-Quichua_Napo/config.json +71 -0
- facebook__mms-tts-qvs-Quechua_San_Martín/config.json +66 -0
- facebook__mms-tts-qvw-Quechua_Huaylla_Wanca/config.json +81 -0
- facebook__mms-tts-qvz-Quichua_Northern_Pastaza/config.json +70 -0
- facebook__mms-tts-qwh-Quechua_Huaylas_Ancash/config.json +72 -0
- facebook__mms-tts-qxh-Quechua_Panao/config.json +77 -0
facebook__mms-tts-ata-Pele-Ata/config.json
ADDED
|
@@ -0,0 +1,68 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "ata",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 19,
|
| 24 |
+
"'": 0,
|
| 25 |
+
"-": 22,
|
| 26 |
+
"0": 18,
|
| 27 |
+
"1": 11,
|
| 28 |
+
"2": 27,
|
| 29 |
+
"4": 25,
|
| 30 |
+
"5": 28,
|
| 31 |
+
"6": 23,
|
| 32 |
+
"7": 2,
|
| 33 |
+
"_": 5,
|
| 34 |
+
"a": 20,
|
| 35 |
+
"b": 6,
|
| 36 |
+
"d": 9,
|
| 37 |
+
"e": 29,
|
| 38 |
+
"f": 12,
|
| 39 |
+
"g": 16,
|
| 40 |
+
"h": 15,
|
| 41 |
+
"i": 1,
|
| 42 |
+
"k": 21,
|
| 43 |
+
"l": 26,
|
| 44 |
+
"m": 24,
|
| 45 |
+
"n": 30,
|
| 46 |
+
"o": 14,
|
| 47 |
+
"p": 7,
|
| 48 |
+
"r": 10,
|
| 49 |
+
"s": 31,
|
| 50 |
+
"t": 17,
|
| 51 |
+
"u": 3,
|
| 52 |
+
"v": 4,
|
| 53 |
+
"x": 32,
|
| 54 |
+
"z": 8,
|
| 55 |
+
"–": 13
|
| 56 |
+
},
|
| 57 |
+
"pad": null,
|
| 58 |
+
"blank": "'",
|
| 59 |
+
"bos": null,
|
| 60 |
+
"eos": null,
|
| 61 |
+
"add_blank_char": true,
|
| 62 |
+
"add_blank_word": false,
|
| 63 |
+
"use_eos_bos": false,
|
| 64 |
+
"blank_at_start": true,
|
| 65 |
+
"blank_at_end": true,
|
| 66 |
+
"word_sep_token": " ",
|
| 67 |
+
"blank_between": "tokens_and_words"
|
| 68 |
+
}
|
facebook__mms-tts-fas-Persian/config.json
ADDED
|
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "fa",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 30,
|
| 24 |
+
"'": 40,
|
| 25 |
+
"-": 35,
|
| 26 |
+
"_": 6,
|
| 27 |
+
"ء": 14,
|
| 28 |
+
"آ": 34,
|
| 29 |
+
"أ": 3,
|
| 30 |
+
"ؤ": 36,
|
| 31 |
+
"ئ": 4,
|
| 32 |
+
"ا": 41,
|
| 33 |
+
"ب": 26,
|
| 34 |
+
"ت": 25,
|
| 35 |
+
"ث": 20,
|
| 36 |
+
"ج": 8,
|
| 37 |
+
"ح": 18,
|
| 38 |
+
"خ": 32,
|
| 39 |
+
"د": 28,
|
| 40 |
+
"ذ": 5,
|
| 41 |
+
"ر": 9,
|
| 42 |
+
"ز": 43,
|
| 43 |
+
"س": 39,
|
| 44 |
+
"ش": 31,
|
| 45 |
+
"ص": 16,
|
| 46 |
+
"ض": 42,
|
| 47 |
+
"ط": 19,
|
| 48 |
+
"ظ": 24,
|
| 49 |
+
"ع": 2,
|
| 50 |
+
"غ": 29,
|
| 51 |
+
"ف": 11,
|
| 52 |
+
"ق": 17,
|
| 53 |
+
"ك": 7,
|
| 54 |
+
"ل": 0,
|
| 55 |
+
"م": 23,
|
| 56 |
+
"ن": 22,
|
| 57 |
+
"ه": 10,
|
| 58 |
+
"و": 27,
|
| 59 |
+
"ي": 13,
|
| 60 |
+
"ٔ": 21,
|
| 61 |
+
"پ": 1,
|
| 62 |
+
"چ": 37,
|
| 63 |
+
"ژ": 38,
|
| 64 |
+
"ک": 33,
|
| 65 |
+
"گ": 12,
|
| 66 |
+
"ی": 15
|
| 67 |
+
},
|
| 68 |
+
"pad": null,
|
| 69 |
+
"blank": "ل",
|
| 70 |
+
"bos": null,
|
| 71 |
+
"eos": null,
|
| 72 |
+
"add_blank_char": true,
|
| 73 |
+
"add_blank_word": false,
|
| 74 |
+
"use_eos_bos": false,
|
| 75 |
+
"blank_at_start": true,
|
| 76 |
+
"blank_at_end": true,
|
| 77 |
+
"word_sep_token": " ",
|
| 78 |
+
"blank_between": "tokens_and_words"
|
| 79 |
+
}
|
facebook__mms-tts-kek-Q’eqchi’/config.json
ADDED
|
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "kek",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 36,
|
| 24 |
+
"'": 7,
|
| 25 |
+
"-": 26,
|
| 26 |
+
"a": 1,
|
| 27 |
+
"b": 11,
|
| 28 |
+
"c": 4,
|
| 29 |
+
"d": 22,
|
| 30 |
+
"e": 8,
|
| 31 |
+
"f": 32,
|
| 32 |
+
"g": 29,
|
| 33 |
+
"h": 14,
|
| 34 |
+
"i": 2,
|
| 35 |
+
"j": 17,
|
| 36 |
+
"k": 15,
|
| 37 |
+
"l": 5,
|
| 38 |
+
"m": 20,
|
| 39 |
+
"n": 6,
|
| 40 |
+
"o": 13,
|
| 41 |
+
"p": 23,
|
| 42 |
+
"q": 19,
|
| 43 |
+
"r": 16,
|
| 44 |
+
"s": 18,
|
| 45 |
+
"t": 9,
|
| 46 |
+
"u": 3,
|
| 47 |
+
"v": 34,
|
| 48 |
+
"x": 12,
|
| 49 |
+
"y": 21,
|
| 50 |
+
"z": 24,
|
| 51 |
+
"|": 0,
|
| 52 |
+
"á": 33,
|
| 53 |
+
"é": 31,
|
| 54 |
+
"í": 28,
|
| 55 |
+
"ñ": 35,
|
| 56 |
+
"ó": 30,
|
| 57 |
+
"ú": 27,
|
| 58 |
+
"̱": 10,
|
| 59 |
+
"—": 25
|
| 60 |
+
},
|
| 61 |
+
"pad": null,
|
| 62 |
+
"blank": "|",
|
| 63 |
+
"bos": null,
|
| 64 |
+
"eos": null,
|
| 65 |
+
"add_blank_char": true,
|
| 66 |
+
"add_blank_word": false,
|
| 67 |
+
"use_eos_bos": false,
|
| 68 |
+
"blank_at_start": true,
|
| 69 |
+
"blank_at_end": true,
|
| 70 |
+
"word_sep_token": " ",
|
| 71 |
+
"blank_between": "tokens_and_words"
|
| 72 |
+
}
|
facebook__mms-tts-kjb-Q’anjob’al/config.json
ADDED
|
@@ -0,0 +1,83 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "kjb",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 47,
|
| 24 |
+
"'": 10,
|
| 25 |
+
"-": 33,
|
| 26 |
+
"0": 36,
|
| 27 |
+
"1": 37,
|
| 28 |
+
"2": 38,
|
| 29 |
+
"3": 41,
|
| 30 |
+
"4": 39,
|
| 31 |
+
"5": 40,
|
| 32 |
+
"6": 43,
|
| 33 |
+
"7": 44,
|
| 34 |
+
"8": 45,
|
| 35 |
+
"9": 42,
|
| 36 |
+
"a": 1,
|
| 37 |
+
"b": 13,
|
| 38 |
+
"c": 5,
|
| 39 |
+
"d": 23,
|
| 40 |
+
"e": 7,
|
| 41 |
+
"f": 32,
|
| 42 |
+
"g": 27,
|
| 43 |
+
"h": 17,
|
| 44 |
+
"i": 2,
|
| 45 |
+
"j": 11,
|
| 46 |
+
"k": 15,
|
| 47 |
+
"l": 6,
|
| 48 |
+
"m": 16,
|
| 49 |
+
"n": 3,
|
| 50 |
+
"o": 9,
|
| 51 |
+
"p": 20,
|
| 52 |
+
"q": 25,
|
| 53 |
+
"r": 22,
|
| 54 |
+
"s": 18,
|
| 55 |
+
"t": 4,
|
| 56 |
+
"u": 12,
|
| 57 |
+
"v": 35,
|
| 58 |
+
"w": 19,
|
| 59 |
+
"x": 14,
|
| 60 |
+
"y": 8,
|
| 61 |
+
"z": 21,
|
| 62 |
+
"|": 0,
|
| 63 |
+
"á": 31,
|
| 64 |
+
"é": 30,
|
| 65 |
+
"í": 29,
|
| 66 |
+
"ñ": 46,
|
| 67 |
+
"ó": 34,
|
| 68 |
+
"ú": 26,
|
| 69 |
+
"ẍ": 24,
|
| 70 |
+
"—": 28
|
| 71 |
+
},
|
| 72 |
+
"pad": null,
|
| 73 |
+
"blank": "|",
|
| 74 |
+
"bos": null,
|
| 75 |
+
"eos": null,
|
| 76 |
+
"add_blank_char": true,
|
| 77 |
+
"add_blank_word": false,
|
| 78 |
+
"use_eos_bos": false,
|
| 79 |
+
"blank_at_start": true,
|
| 80 |
+
"blank_at_end": true,
|
| 81 |
+
"word_sep_token": " ",
|
| 82 |
+
"blank_between": "tokens_and_words"
|
| 83 |
+
}
|
facebook__mms-tts-lje-Rampi/config.json
ADDED
|
@@ -0,0 +1,70 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "lje",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 31,
|
| 24 |
+
"'": 33,
|
| 25 |
+
"-": 25,
|
| 26 |
+
"0": 34,
|
| 27 |
+
"1": 20,
|
| 28 |
+
"2": 23,
|
| 29 |
+
"3": 11,
|
| 30 |
+
"4": 16,
|
| 31 |
+
"5": 4,
|
| 32 |
+
"6": 29,
|
| 33 |
+
"7": 10,
|
| 34 |
+
"_": 9,
|
| 35 |
+
"a": 24,
|
| 36 |
+
"b": 0,
|
| 37 |
+
"c": 7,
|
| 38 |
+
"d": 21,
|
| 39 |
+
"e": 6,
|
| 40 |
+
"f": 28,
|
| 41 |
+
"g": 3,
|
| 42 |
+
"h": 14,
|
| 43 |
+
"i": 17,
|
| 44 |
+
"j": 1,
|
| 45 |
+
"k": 30,
|
| 46 |
+
"l": 22,
|
| 47 |
+
"m": 32,
|
| 48 |
+
"n": 12,
|
| 49 |
+
"o": 8,
|
| 50 |
+
"p": 13,
|
| 51 |
+
"r": 19,
|
| 52 |
+
"s": 27,
|
| 53 |
+
"t": 2,
|
| 54 |
+
"u": 15,
|
| 55 |
+
"w": 5,
|
| 56 |
+
"y": 26,
|
| 57 |
+
"ꞌ": 18
|
| 58 |
+
},
|
| 59 |
+
"pad": null,
|
| 60 |
+
"blank": "b",
|
| 61 |
+
"bos": null,
|
| 62 |
+
"eos": null,
|
| 63 |
+
"add_blank_char": true,
|
| 64 |
+
"add_blank_word": false,
|
| 65 |
+
"use_eos_bos": false,
|
| 66 |
+
"blank_at_start": true,
|
| 67 |
+
"blank_at_end": true,
|
| 68 |
+
"word_sep_token": " ",
|
| 69 |
+
"blank_between": "tokens_and_words"
|
| 70 |
+
}
|
facebook__mms-tts-lme-Pévé/config.json
ADDED
|
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "lme",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 36,
|
| 24 |
+
"'": 14,
|
| 25 |
+
"-": 35,
|
| 26 |
+
"a": 1,
|
| 27 |
+
"b": 15,
|
| 28 |
+
"c": 22,
|
| 29 |
+
"d": 10,
|
| 30 |
+
"e": 13,
|
| 31 |
+
"f": 23,
|
| 32 |
+
"g": 21,
|
| 33 |
+
"h": 19,
|
| 34 |
+
"i": 5,
|
| 35 |
+
"j": 30,
|
| 36 |
+
"k": 7,
|
| 37 |
+
"l": 26,
|
| 38 |
+
"m": 4,
|
| 39 |
+
"n": 3,
|
| 40 |
+
"o": 16,
|
| 41 |
+
"p": 31,
|
| 42 |
+
"r": 9,
|
| 43 |
+
"s": 12,
|
| 44 |
+
"t": 17,
|
| 45 |
+
"u": 6,
|
| 46 |
+
"v": 27,
|
| 47 |
+
"w": 8,
|
| 48 |
+
"y": 11,
|
| 49 |
+
"z": 18,
|
| 50 |
+
"|": 0,
|
| 51 |
+
"â": 24,
|
| 52 |
+
"ê": 34,
|
| 53 |
+
"î": 32,
|
| 54 |
+
"ô": 29,
|
| 55 |
+
"û": 33,
|
| 56 |
+
"ŋ": 25,
|
| 57 |
+
"ɓ": 20,
|
| 58 |
+
"ɗ": 28,
|
| 59 |
+
"ə": 2
|
| 60 |
+
},
|
| 61 |
+
"pad": null,
|
| 62 |
+
"blank": "|",
|
| 63 |
+
"bos": null,
|
| 64 |
+
"eos": null,
|
| 65 |
+
"add_blank_char": true,
|
| 66 |
+
"add_blank_word": false,
|
| 67 |
+
"use_eos_bos": false,
|
| 68 |
+
"blank_at_start": true,
|
| 69 |
+
"blank_at_end": true,
|
| 70 |
+
"word_sep_token": " ",
|
| 71 |
+
"blank_between": "tokens_and_words"
|
| 72 |
+
}
|
facebook__mms-tts-pab-Parecís/config.json
ADDED
|
@@ -0,0 +1,85 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pab",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 49,
|
| 24 |
+
"'": 48,
|
| 25 |
+
"-": 27,
|
| 26 |
+
"0": 29,
|
| 27 |
+
"1": 34,
|
| 28 |
+
"2": 36,
|
| 29 |
+
"3": 44,
|
| 30 |
+
"4": 38,
|
| 31 |
+
"5": 40,
|
| 32 |
+
"6": 43,
|
| 33 |
+
"7": 39,
|
| 34 |
+
"8": 45,
|
| 35 |
+
"9": 46,
|
| 36 |
+
"a": 0,
|
| 37 |
+
"b": 19,
|
| 38 |
+
"c": 21,
|
| 39 |
+
"d": 20,
|
| 40 |
+
"e": 2,
|
| 41 |
+
"f": 22,
|
| 42 |
+
"g": 28,
|
| 43 |
+
"h": 5,
|
| 44 |
+
"i": 3,
|
| 45 |
+
"j": 16,
|
| 46 |
+
"k": 7,
|
| 47 |
+
"l": 14,
|
| 48 |
+
"m": 13,
|
| 49 |
+
"n": 8,
|
| 50 |
+
"o": 4,
|
| 51 |
+
"p": 23,
|
| 52 |
+
"q": 32,
|
| 53 |
+
"r": 10,
|
| 54 |
+
"s": 12,
|
| 55 |
+
"t": 6,
|
| 56 |
+
"u": 17,
|
| 57 |
+
"v": 31,
|
| 58 |
+
"w": 15,
|
| 59 |
+
"x": 11,
|
| 60 |
+
"y": 9,
|
| 61 |
+
"z": 35,
|
| 62 |
+
"|": 1,
|
| 63 |
+
"á": 25,
|
| 64 |
+
"â": 47,
|
| 65 |
+
"ã": 26,
|
| 66 |
+
"é": 24,
|
| 67 |
+
"ê": 41,
|
| 68 |
+
"í": 33,
|
| 69 |
+
"ó": 30,
|
| 70 |
+
"ô": 37,
|
| 71 |
+
"ú": 42,
|
| 72 |
+
"—": 18
|
| 73 |
+
},
|
| 74 |
+
"pad": null,
|
| 75 |
+
"blank": "a",
|
| 76 |
+
"bos": null,
|
| 77 |
+
"eos": null,
|
| 78 |
+
"add_blank_char": true,
|
| 79 |
+
"add_blank_word": false,
|
| 80 |
+
"use_eos_bos": false,
|
| 81 |
+
"blank_at_start": true,
|
| 82 |
+
"blank_at_end": true,
|
| 83 |
+
"word_sep_token": " ",
|
| 84 |
+
"blank_between": "tokens_and_words"
|
| 85 |
+
}
|
facebook__mms-tts-pad-Paumarí/config.json
ADDED
|
@@ -0,0 +1,86 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pad",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 50,
|
| 24 |
+
"'": 10,
|
| 25 |
+
"-": 18,
|
| 26 |
+
"0": 35,
|
| 27 |
+
"1": 34,
|
| 28 |
+
"2": 37,
|
| 29 |
+
"3": 45,
|
| 30 |
+
"4": 38,
|
| 31 |
+
"5": 42,
|
| 32 |
+
"6": 43,
|
| 33 |
+
"7": 36,
|
| 34 |
+
"8": 46,
|
| 35 |
+
"9": 47,
|
| 36 |
+
"a": 0,
|
| 37 |
+
"b": 12,
|
| 38 |
+
"c": 22,
|
| 39 |
+
"d": 9,
|
| 40 |
+
"e": 15,
|
| 41 |
+
"f": 21,
|
| 42 |
+
"g": 19,
|
| 43 |
+
"h": 5,
|
| 44 |
+
"i": 1,
|
| 45 |
+
"j": 11,
|
| 46 |
+
"k": 6,
|
| 47 |
+
"l": 24,
|
| 48 |
+
"m": 14,
|
| 49 |
+
"n": 3,
|
| 50 |
+
"o": 4,
|
| 51 |
+
"p": 20,
|
| 52 |
+
"q": 30,
|
| 53 |
+
"r": 7,
|
| 54 |
+
"s": 13,
|
| 55 |
+
"t": 17,
|
| 56 |
+
"u": 16,
|
| 57 |
+
"v": 8,
|
| 58 |
+
"x": 27,
|
| 59 |
+
"z": 31,
|
| 60 |
+
"|": 2,
|
| 61 |
+
"á": 28,
|
| 62 |
+
"â": 39,
|
| 63 |
+
"ã": 26,
|
| 64 |
+
"ç": 44,
|
| 65 |
+
"é": 25,
|
| 66 |
+
"ê": 40,
|
| 67 |
+
"í": 32,
|
| 68 |
+
"î": 48,
|
| 69 |
+
"ó": 29,
|
| 70 |
+
"ô": 33,
|
| 71 |
+
"õ": 49,
|
| 72 |
+
"ú": 41,
|
| 73 |
+
"—": 23
|
| 74 |
+
},
|
| 75 |
+
"pad": null,
|
| 76 |
+
"blank": "a",
|
| 77 |
+
"bos": null,
|
| 78 |
+
"eos": null,
|
| 79 |
+
"add_blank_char": true,
|
| 80 |
+
"add_blank_word": false,
|
| 81 |
+
"use_eos_bos": false,
|
| 82 |
+
"blank_at_start": true,
|
| 83 |
+
"blank_at_end": true,
|
| 84 |
+
"word_sep_token": " ",
|
| 85 |
+
"blank_between": "tokens_and_words"
|
| 86 |
+
}
|
facebook__mms-tts-pag-Pangasinan/config.json
ADDED
|
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pag",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 31,
|
| 24 |
+
"'": 21,
|
| 25 |
+
"-": 23,
|
| 26 |
+
"a": 0,
|
| 27 |
+
"b": 16,
|
| 28 |
+
"c": 20,
|
| 29 |
+
"d": 13,
|
| 30 |
+
"e": 8,
|
| 31 |
+
"f": 24,
|
| 32 |
+
"g": 10,
|
| 33 |
+
"h": 22,
|
| 34 |
+
"i": 3,
|
| 35 |
+
"j": 19,
|
| 36 |
+
"k": 9,
|
| 37 |
+
"l": 11,
|
| 38 |
+
"m": 12,
|
| 39 |
+
"n": 2,
|
| 40 |
+
"o": 4,
|
| 41 |
+
"p": 14,
|
| 42 |
+
"q": 28,
|
| 43 |
+
"r": 15,
|
| 44 |
+
"s": 6,
|
| 45 |
+
"t": 5,
|
| 46 |
+
"u": 17,
|
| 47 |
+
"v": 27,
|
| 48 |
+
"w": 18,
|
| 49 |
+
"x": 29,
|
| 50 |
+
"y": 7,
|
| 51 |
+
"z": 25,
|
| 52 |
+
"|": 1,
|
| 53 |
+
"–": 30,
|
| 54 |
+
"—": 26
|
| 55 |
+
},
|
| 56 |
+
"pad": null,
|
| 57 |
+
"blank": "a",
|
| 58 |
+
"bos": null,
|
| 59 |
+
"eos": null,
|
| 60 |
+
"add_blank_char": true,
|
| 61 |
+
"add_blank_word": false,
|
| 62 |
+
"use_eos_bos": false,
|
| 63 |
+
"blank_at_start": true,
|
| 64 |
+
"blank_at_end": true,
|
| 65 |
+
"word_sep_token": " ",
|
| 66 |
+
"blank_between": "tokens_and_words"
|
| 67 |
+
}
|
facebook__mms-tts-pan-Punjabi_Eastern/config.json
ADDED
|
@@ -0,0 +1,94 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pa",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 31,
|
| 24 |
+
"-": 5,
|
| 25 |
+
"6": 28,
|
| 26 |
+
"_": 7,
|
| 27 |
+
"l": 6,
|
| 28 |
+
"ਂ": 40,
|
| 29 |
+
"ਅ": 44,
|
| 30 |
+
"ਆ": 48,
|
| 31 |
+
"ਇ": 10,
|
| 32 |
+
"ਈ": 37,
|
| 33 |
+
"ਉ": 43,
|
| 34 |
+
"ਊ": 19,
|
| 35 |
+
"ਏ": 0,
|
| 36 |
+
"ਐ": 36,
|
| 37 |
+
"ਓ": 41,
|
| 38 |
+
"ਔ": 24,
|
| 39 |
+
"ਕ": 53,
|
| 40 |
+
"ਖ": 45,
|
| 41 |
+
"ਗ": 33,
|
| 42 |
+
"ਘ": 38,
|
| 43 |
+
"ਚ": 49,
|
| 44 |
+
"ਛ": 30,
|
| 45 |
+
"ਜ": 23,
|
| 46 |
+
"ਝ": 18,
|
| 47 |
+
"ਟ": 1,
|
| 48 |
+
"ਠ": 4,
|
| 49 |
+
"ਡ": 46,
|
| 50 |
+
"ਢ": 54,
|
| 51 |
+
"ਣ": 12,
|
| 52 |
+
"ਤ": 51,
|
| 53 |
+
"ਥ": 13,
|
| 54 |
+
"ਦ": 25,
|
| 55 |
+
"ਧ": 20,
|
| 56 |
+
"ਨ": 14,
|
| 57 |
+
"ਪ": 11,
|
| 58 |
+
"ਫ": 17,
|
| 59 |
+
"ਬ": 34,
|
| 60 |
+
"ਭ": 39,
|
| 61 |
+
"ਮ": 57,
|
| 62 |
+
"ਯ": 16,
|
| 63 |
+
"ਰ": 55,
|
| 64 |
+
"ਲ": 47,
|
| 65 |
+
"ਵ": 50,
|
| 66 |
+
"ਸ": 15,
|
| 67 |
+
"ਹ": 52,
|
| 68 |
+
"਼": 9,
|
| 69 |
+
"ਾ": 56,
|
| 70 |
+
"ਿ": 22,
|
| 71 |
+
"ੀ": 32,
|
| 72 |
+
"ੁ": 21,
|
| 73 |
+
"ੂ": 29,
|
| 74 |
+
"ੇ": 42,
|
| 75 |
+
"ੈ": 3,
|
| 76 |
+
"ੋ": 26,
|
| 77 |
+
"ੌ": 27,
|
| 78 |
+
"੍": 35,
|
| 79 |
+
"ੜ": 8,
|
| 80 |
+
"ੰ": 2,
|
| 81 |
+
"ੱ": 58
|
| 82 |
+
},
|
| 83 |
+
"pad": null,
|
| 84 |
+
"blank": "ਏ",
|
| 85 |
+
"bos": null,
|
| 86 |
+
"eos": null,
|
| 87 |
+
"add_blank_char": true,
|
| 88 |
+
"add_blank_word": false,
|
| 89 |
+
"use_eos_bos": false,
|
| 90 |
+
"blank_at_start": true,
|
| 91 |
+
"blank_at_end": true,
|
| 92 |
+
"word_sep_token": " ",
|
| 93 |
+
"blank_between": "tokens_and_words"
|
| 94 |
+
}
|
facebook__mms-tts-pap-Papiamentu/config.json
ADDED
|
@@ -0,0 +1,86 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pap",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 48,
|
| 24 |
+
"'": 1,
|
| 25 |
+
"-": 14,
|
| 26 |
+
"0": 0,
|
| 27 |
+
"1": 31,
|
| 28 |
+
"2": 24,
|
| 29 |
+
"3": 43,
|
| 30 |
+
"4": 12,
|
| 31 |
+
"5": 8,
|
| 32 |
+
"6": 25,
|
| 33 |
+
"7": 3,
|
| 34 |
+
"8": 36,
|
| 35 |
+
"9": 35,
|
| 36 |
+
"_": 9,
|
| 37 |
+
"a": 33,
|
| 38 |
+
"b": 18,
|
| 39 |
+
"c": 44,
|
| 40 |
+
"d": 41,
|
| 41 |
+
"e": 16,
|
| 42 |
+
"f": 2,
|
| 43 |
+
"g": 6,
|
| 44 |
+
"h": 13,
|
| 45 |
+
"i": 40,
|
| 46 |
+
"j": 28,
|
| 47 |
+
"k": 50,
|
| 48 |
+
"l": 19,
|
| 49 |
+
"m": 26,
|
| 50 |
+
"n": 20,
|
| 51 |
+
"o": 21,
|
| 52 |
+
"p": 30,
|
| 53 |
+
"q": 4,
|
| 54 |
+
"r": 7,
|
| 55 |
+
"s": 45,
|
| 56 |
+
"t": 32,
|
| 57 |
+
"u": 15,
|
| 58 |
+
"v": 49,
|
| 59 |
+
"w": 38,
|
| 60 |
+
"x": 5,
|
| 61 |
+
"y": 11,
|
| 62 |
+
"z": 23,
|
| 63 |
+
"á": 47,
|
| 64 |
+
"è": 42,
|
| 65 |
+
"é": 37,
|
| 66 |
+
"í": 39,
|
| 67 |
+
"ñ": 27,
|
| 68 |
+
"ò": 34,
|
| 69 |
+
"ó": 10,
|
| 70 |
+
"ù": 17,
|
| 71 |
+
"ú": 29,
|
| 72 |
+
"ü": 46,
|
| 73 |
+
"—": 22
|
| 74 |
+
},
|
| 75 |
+
"pad": null,
|
| 76 |
+
"blank": "0",
|
| 77 |
+
"bos": null,
|
| 78 |
+
"eos": null,
|
| 79 |
+
"add_blank_char": true,
|
| 80 |
+
"add_blank_word": false,
|
| 81 |
+
"use_eos_bos": false,
|
| 82 |
+
"blank_at_start": true,
|
| 83 |
+
"blank_at_end": true,
|
| 84 |
+
"word_sep_token": " ",
|
| 85 |
+
"blank_between": "tokens_and_words"
|
| 86 |
+
}
|
facebook__mms-tts-pbc-Patamona/config.json
ADDED
|
@@ -0,0 +1,77 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pbc",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 41,
|
| 24 |
+
"'": 17,
|
| 25 |
+
"-": 40,
|
| 26 |
+
"0": 24,
|
| 27 |
+
"1": 26,
|
| 28 |
+
"2": 30,
|
| 29 |
+
"3": 34,
|
| 30 |
+
"4": 32,
|
| 31 |
+
"5": 33,
|
| 32 |
+
"6": 35,
|
| 33 |
+
"7": 29,
|
| 34 |
+
"8": 37,
|
| 35 |
+
"9": 38,
|
| 36 |
+
"a": 1,
|
| 37 |
+
"b": 23,
|
| 38 |
+
"c": 19,
|
| 39 |
+
"d": 22,
|
| 40 |
+
"e": 5,
|
| 41 |
+
"f": 31,
|
| 42 |
+
"g": 25,
|
| 43 |
+
"h": 18,
|
| 44 |
+
"i": 9,
|
| 45 |
+
"j": 20,
|
| 46 |
+
"k": 2,
|
| 47 |
+
"l": 10,
|
| 48 |
+
"m": 13,
|
| 49 |
+
"n": 4,
|
| 50 |
+
"o": 6,
|
| 51 |
+
"p": 3,
|
| 52 |
+
"q": 39,
|
| 53 |
+
"r": 21,
|
| 54 |
+
"s": 15,
|
| 55 |
+
"t": 7,
|
| 56 |
+
"u": 12,
|
| 57 |
+
"v": 28,
|
| 58 |
+
"w": 16,
|
| 59 |
+
"x": 36,
|
| 60 |
+
"y": 14,
|
| 61 |
+
"z": 27,
|
| 62 |
+
"|": 0,
|
| 63 |
+
"à": 8,
|
| 64 |
+
"ù": 11
|
| 65 |
+
},
|
| 66 |
+
"pad": null,
|
| 67 |
+
"blank": "|",
|
| 68 |
+
"bos": null,
|
| 69 |
+
"eos": null,
|
| 70 |
+
"add_blank_char": true,
|
| 71 |
+
"add_blank_word": false,
|
| 72 |
+
"use_eos_bos": false,
|
| 73 |
+
"blank_at_start": true,
|
| 74 |
+
"blank_at_end": true,
|
| 75 |
+
"word_sep_token": " ",
|
| 76 |
+
"blank_between": "tokens_and_words"
|
| 77 |
+
}
|
facebook__mms-tts-pbi-Parkwa/config.json
ADDED
|
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pbi",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 35,
|
| 24 |
+
"-": 32,
|
| 25 |
+
"1": 34,
|
| 26 |
+
"a": 1,
|
| 27 |
+
"b": 14,
|
| 28 |
+
"c": 31,
|
| 29 |
+
"d": 5,
|
| 30 |
+
"e": 9,
|
| 31 |
+
"f": 26,
|
| 32 |
+
"g": 19,
|
| 33 |
+
"h": 18,
|
| 34 |
+
"i": 10,
|
| 35 |
+
"j": 30,
|
| 36 |
+
"k": 3,
|
| 37 |
+
"l": 7,
|
| 38 |
+
"m": 6,
|
| 39 |
+
"n": 4,
|
| 40 |
+
"p": 29,
|
| 41 |
+
"r": 15,
|
| 42 |
+
"s": 11,
|
| 43 |
+
"t": 8,
|
| 44 |
+
"u": 16,
|
| 45 |
+
"v": 22,
|
| 46 |
+
"w": 12,
|
| 47 |
+
"y": 21,
|
| 48 |
+
"z": 17,
|
| 49 |
+
"|": 0,
|
| 50 |
+
"à": 25,
|
| 51 |
+
"á": 24,
|
| 52 |
+
"ŋ": 13,
|
| 53 |
+
"ɓ": 27,
|
| 54 |
+
"ɗ": 20,
|
| 55 |
+
"ə": 2,
|
| 56 |
+
"ɨ": 23,
|
| 57 |
+
"́": 28,
|
| 58 |
+
"̌": 33
|
| 59 |
+
},
|
| 60 |
+
"pad": null,
|
| 61 |
+
"blank": "|",
|
| 62 |
+
"bos": null,
|
| 63 |
+
"eos": null,
|
| 64 |
+
"add_blank_char": true,
|
| 65 |
+
"add_blank_word": false,
|
| 66 |
+
"use_eos_bos": false,
|
| 67 |
+
"blank_at_start": true,
|
| 68 |
+
"blank_at_end": true,
|
| 69 |
+
"word_sep_token": " ",
|
| 70 |
+
"blank_between": "tokens_and_words"
|
| 71 |
+
}
|
facebook__mms-tts-pcm-Pidgin_Nigerian/config.json
ADDED
|
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pcm",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 35,
|
| 24 |
+
"'": 28,
|
| 25 |
+
"-": 24,
|
| 26 |
+
"0": 27,
|
| 27 |
+
"1": 29,
|
| 28 |
+
"2": 30,
|
| 29 |
+
"3": 34,
|
| 30 |
+
"4": 32,
|
| 31 |
+
"5": 31,
|
| 32 |
+
"7": 33,
|
| 33 |
+
"a": 3,
|
| 34 |
+
"b": 19,
|
| 35 |
+
"c": 22,
|
| 36 |
+
"d": 6,
|
| 37 |
+
"e": 1,
|
| 38 |
+
"f": 18,
|
| 39 |
+
"g": 16,
|
| 40 |
+
"h": 20,
|
| 41 |
+
"i": 4,
|
| 42 |
+
"j": 23,
|
| 43 |
+
"k": 14,
|
| 44 |
+
"l": 11,
|
| 45 |
+
"m": 12,
|
| 46 |
+
"n": 5,
|
| 47 |
+
"o": 2,
|
| 48 |
+
"p": 17,
|
| 49 |
+
"r": 9,
|
| 50 |
+
"s": 7,
|
| 51 |
+
"t": 8,
|
| 52 |
+
"u": 15,
|
| 53 |
+
"v": 21,
|
| 54 |
+
"w": 13,
|
| 55 |
+
"x": 26,
|
| 56 |
+
"y": 10,
|
| 57 |
+
"z": 25,
|
| 58 |
+
"|": 0
|
| 59 |
+
},
|
| 60 |
+
"pad": null,
|
| 61 |
+
"blank": "|",
|
| 62 |
+
"bos": null,
|
| 63 |
+
"eos": null,
|
| 64 |
+
"add_blank_char": true,
|
| 65 |
+
"add_blank_word": false,
|
| 66 |
+
"use_eos_bos": false,
|
| 67 |
+
"blank_at_start": true,
|
| 68 |
+
"blank_at_end": true,
|
| 69 |
+
"word_sep_token": " ",
|
| 70 |
+
"blank_between": "tokens_and_words"
|
| 71 |
+
}
|
facebook__mms-tts-peg-Pengo/config.json
ADDED
|
@@ -0,0 +1,73 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "peg",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 37,
|
| 24 |
+
"|": 0,
|
| 25 |
+
"ଂ": 15,
|
| 26 |
+
"ଃ": 36,
|
| 27 |
+
"ଅ": 34,
|
| 28 |
+
"ଆ": 17,
|
| 29 |
+
"ଇ": 16,
|
| 30 |
+
"ଉ": 33,
|
| 31 |
+
"ଏ": 30,
|
| 32 |
+
"ଓ": 35,
|
| 33 |
+
"କ": 8,
|
| 34 |
+
"ଗ": 13,
|
| 35 |
+
"ଙ": 26,
|
| 36 |
+
"ଚ": 23,
|
| 37 |
+
"ଜ": 10,
|
| 38 |
+
"ଞ": 32,
|
| 39 |
+
"ଟ": 29,
|
| 40 |
+
"ଡ": 25,
|
| 41 |
+
"ଣ": 28,
|
| 42 |
+
"ତ": 7,
|
| 43 |
+
"ଦ": 19,
|
| 44 |
+
"ନ": 6,
|
| 45 |
+
"ପ": 20,
|
| 46 |
+
"ବ": 21,
|
| 47 |
+
"ମ": 14,
|
| 48 |
+
"ର": 5,
|
| 49 |
+
"ଲ": 24,
|
| 50 |
+
"ସ": 18,
|
| 51 |
+
"ହ": 9,
|
| 52 |
+
"଼": 22,
|
| 53 |
+
"ା": 1,
|
| 54 |
+
"ି": 3,
|
| 55 |
+
"ୁ": 12,
|
| 56 |
+
"େ": 4,
|
| 57 |
+
"୍": 2,
|
| 58 |
+
"ୟ": 27,
|
| 59 |
+
"ୱ": 11,
|
| 60 |
+
"": 31
|
| 61 |
+
},
|
| 62 |
+
"pad": null,
|
| 63 |
+
"blank": "|",
|
| 64 |
+
"bos": null,
|
| 65 |
+
"eos": null,
|
| 66 |
+
"add_blank_char": true,
|
| 67 |
+
"add_blank_word": false,
|
| 68 |
+
"use_eos_bos": false,
|
| 69 |
+
"blank_at_start": true,
|
| 70 |
+
"blank_at_end": true,
|
| 71 |
+
"word_sep_token": " ",
|
| 72 |
+
"blank_between": "tokens_and_words"
|
| 73 |
+
}
|
facebook__mms-tts-pez-Penan_Eastern/config.json
ADDED
|
@@ -0,0 +1,68 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pez",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 14,
|
| 24 |
+
"'": 32,
|
| 25 |
+
"-": 4,
|
| 26 |
+
"0": 7,
|
| 27 |
+
"1": 20,
|
| 28 |
+
"2": 9,
|
| 29 |
+
"4": 27,
|
| 30 |
+
"6": 13,
|
| 31 |
+
"_": 3,
|
| 32 |
+
"a": 15,
|
| 33 |
+
"b": 0,
|
| 34 |
+
"c": 8,
|
| 35 |
+
"d": 30,
|
| 36 |
+
"e": 18,
|
| 37 |
+
"g": 5,
|
| 38 |
+
"h": 1,
|
| 39 |
+
"i": 17,
|
| 40 |
+
"j": 16,
|
| 41 |
+
"k": 25,
|
| 42 |
+
"l": 6,
|
| 43 |
+
"m": 26,
|
| 44 |
+
"n": 11,
|
| 45 |
+
"o": 12,
|
| 46 |
+
"p": 2,
|
| 47 |
+
"r": 24,
|
| 48 |
+
"s": 22,
|
| 49 |
+
"t": 31,
|
| 50 |
+
"u": 10,
|
| 51 |
+
"v": 19,
|
| 52 |
+
"w": 21,
|
| 53 |
+
"y": 28,
|
| 54 |
+
"z": 29,
|
| 55 |
+
"é": 23
|
| 56 |
+
},
|
| 57 |
+
"pad": null,
|
| 58 |
+
"blank": "b",
|
| 59 |
+
"bos": null,
|
| 60 |
+
"eos": null,
|
| 61 |
+
"add_blank_char": true,
|
| 62 |
+
"add_blank_word": false,
|
| 63 |
+
"use_eos_bos": false,
|
| 64 |
+
"blank_at_start": true,
|
| 65 |
+
"blank_at_end": true,
|
| 66 |
+
"word_sep_token": " ",
|
| 67 |
+
"blank_between": "tokens_and_words"
|
| 68 |
+
}
|
facebook__mms-tts-pir-Piratapuyo/config.json
ADDED
|
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pir",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 43,
|
| 24 |
+
"'": 38,
|
| 25 |
+
"a": 1,
|
| 26 |
+
"b": 23,
|
| 27 |
+
"c": 13,
|
| 28 |
+
"d": 18,
|
| 29 |
+
"e": 3,
|
| 30 |
+
"f": 32,
|
| 31 |
+
"g": 20,
|
| 32 |
+
"h": 6,
|
| 33 |
+
"i": 2,
|
| 34 |
+
"j": 16,
|
| 35 |
+
"k": 40,
|
| 36 |
+
"l": 27,
|
| 37 |
+
"m": 15,
|
| 38 |
+
"n": 10,
|
| 39 |
+
"o": 5,
|
| 40 |
+
"p": 17,
|
| 41 |
+
"q": 14,
|
| 42 |
+
"r": 4,
|
| 43 |
+
"s": 12,
|
| 44 |
+
"t": 9,
|
| 45 |
+
"u": 8,
|
| 46 |
+
"v": 33,
|
| 47 |
+
"w": 24,
|
| 48 |
+
"x": 41,
|
| 49 |
+
"y": 11,
|
| 50 |
+
"z": 35,
|
| 51 |
+
"|": 0,
|
| 52 |
+
"á": 36,
|
| 53 |
+
"ã": 22,
|
| 54 |
+
"é": 34,
|
| 55 |
+
"í": 31,
|
| 56 |
+
"ñ": 21,
|
| 57 |
+
"ó": 39,
|
| 58 |
+
"õ": 28,
|
| 59 |
+
"ú": 37,
|
| 60 |
+
"ĩ": 29,
|
| 61 |
+
"ũ": 26,
|
| 62 |
+
"ʉ": 7,
|
| 63 |
+
"́": 42,
|
| 64 |
+
"̃": 19,
|
| 65 |
+
"ẽ": 25,
|
| 66 |
+
"—": 30
|
| 67 |
+
},
|
| 68 |
+
"pad": null,
|
| 69 |
+
"blank": "|",
|
| 70 |
+
"bos": null,
|
| 71 |
+
"eos": null,
|
| 72 |
+
"add_blank_char": true,
|
| 73 |
+
"add_blank_word": false,
|
| 74 |
+
"use_eos_bos": false,
|
| 75 |
+
"blank_at_start": true,
|
| 76 |
+
"blank_at_end": true,
|
| 77 |
+
"word_sep_token": " ",
|
| 78 |
+
"blank_between": "tokens_and_words"
|
| 79 |
+
}
|
facebook__mms-tts-pis-Pijin/config.json
ADDED
|
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pis",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 35,
|
| 24 |
+
"'": 25,
|
| 25 |
+
"-": 23,
|
| 26 |
+
"0": 24,
|
| 27 |
+
"1": 26,
|
| 28 |
+
"2": 27,
|
| 29 |
+
"3": 32,
|
| 30 |
+
"4": 28,
|
| 31 |
+
"5": 30,
|
| 32 |
+
"6": 31,
|
| 33 |
+
"7": 33,
|
| 34 |
+
"8": 34,
|
| 35 |
+
"9": 29,
|
| 36 |
+
"a": 1,
|
| 37 |
+
"b": 15,
|
| 38 |
+
"d": 16,
|
| 39 |
+
"e": 2,
|
| 40 |
+
"f": 12,
|
| 41 |
+
"g": 10,
|
| 42 |
+
"h": 13,
|
| 43 |
+
"i": 5,
|
| 44 |
+
"j": 22,
|
| 45 |
+
"k": 11,
|
| 46 |
+
"l": 7,
|
| 47 |
+
"m": 4,
|
| 48 |
+
"n": 6,
|
| 49 |
+
"o": 3,
|
| 50 |
+
"p": 18,
|
| 51 |
+
"r": 17,
|
| 52 |
+
"s": 9,
|
| 53 |
+
"t": 8,
|
| 54 |
+
"u": 14,
|
| 55 |
+
"v": 21,
|
| 56 |
+
"w": 20,
|
| 57 |
+
"y": 19,
|
| 58 |
+
"|": 0
|
| 59 |
+
},
|
| 60 |
+
"pad": null,
|
| 61 |
+
"blank": "|",
|
| 62 |
+
"bos": null,
|
| 63 |
+
"eos": null,
|
| 64 |
+
"add_blank_char": true,
|
| 65 |
+
"add_blank_word": false,
|
| 66 |
+
"use_eos_bos": false,
|
| 67 |
+
"blank_at_start": true,
|
| 68 |
+
"blank_at_end": true,
|
| 69 |
+
"word_sep_token": " ",
|
| 70 |
+
"blank_between": "tokens_and_words"
|
| 71 |
+
}
|
facebook__mms-tts-pjt-Pitjantjatjara/config.json
ADDED
|
@@ -0,0 +1,80 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pjt",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 35,
|
| 24 |
+
"'": 13,
|
| 25 |
+
"-": 30,
|
| 26 |
+
"0": 37,
|
| 27 |
+
"1": 28,
|
| 28 |
+
"2": 36,
|
| 29 |
+
"3": 14,
|
| 30 |
+
"4": 8,
|
| 31 |
+
"5": 18,
|
| 32 |
+
"6": 6,
|
| 33 |
+
"7": 41,
|
| 34 |
+
"8": 22,
|
| 35 |
+
"9": 17,
|
| 36 |
+
"_": 11,
|
| 37 |
+
"a": 44,
|
| 38 |
+
"b": 10,
|
| 39 |
+
"c": 4,
|
| 40 |
+
"d": 1,
|
| 41 |
+
"e": 38,
|
| 42 |
+
"f": 32,
|
| 43 |
+
"g": 26,
|
| 44 |
+
"h": 23,
|
| 45 |
+
"i": 42,
|
| 46 |
+
"j": 39,
|
| 47 |
+
"k": 43,
|
| 48 |
+
"l": 24,
|
| 49 |
+
"m": 2,
|
| 50 |
+
"n": 31,
|
| 51 |
+
"o": 25,
|
| 52 |
+
"p": 12,
|
| 53 |
+
"r": 34,
|
| 54 |
+
"s": 20,
|
| 55 |
+
"t": 40,
|
| 56 |
+
"u": 29,
|
| 57 |
+
"v": 3,
|
| 58 |
+
"w": 21,
|
| 59 |
+
"x": 27,
|
| 60 |
+
"y": 0,
|
| 61 |
+
"z": 5,
|
| 62 |
+
"ḻ": 7,
|
| 63 |
+
"ṉ": 16,
|
| 64 |
+
"ṟ": 15,
|
| 65 |
+
"ṯ": 33,
|
| 66 |
+
"–": 19,
|
| 67 |
+
"—": 9
|
| 68 |
+
},
|
| 69 |
+
"pad": null,
|
| 70 |
+
"blank": "y",
|
| 71 |
+
"bos": null,
|
| 72 |
+
"eos": null,
|
| 73 |
+
"add_blank_char": true,
|
| 74 |
+
"add_blank_word": false,
|
| 75 |
+
"use_eos_bos": false,
|
| 76 |
+
"blank_at_start": true,
|
| 77 |
+
"blank_at_end": true,
|
| 78 |
+
"word_sep_token": " ",
|
| 79 |
+
"blank_between": "tokens_and_words"
|
| 80 |
+
}
|
facebook__mms-tts-pls-Popoloca_San_Marcos_Tlacoyalco/config.json
ADDED
|
@@ -0,0 +1,80 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pls",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 1,
|
| 24 |
+
"'": 17,
|
| 25 |
+
"-": 11,
|
| 26 |
+
"0": 31,
|
| 27 |
+
"1": 19,
|
| 28 |
+
"2": 40,
|
| 29 |
+
"3": 18,
|
| 30 |
+
"4": 4,
|
| 31 |
+
"6": 3,
|
| 32 |
+
"7": 0,
|
| 33 |
+
"_": 13,
|
| 34 |
+
"a": 2,
|
| 35 |
+
"b": 15,
|
| 36 |
+
"c": 38,
|
| 37 |
+
"d": 26,
|
| 38 |
+
"e": 9,
|
| 39 |
+
"f": 33,
|
| 40 |
+
"g": 23,
|
| 41 |
+
"h": 36,
|
| 42 |
+
"i": 32,
|
| 43 |
+
"j": 44,
|
| 44 |
+
"k": 10,
|
| 45 |
+
"l": 7,
|
| 46 |
+
"m": 6,
|
| 47 |
+
"n": 39,
|
| 48 |
+
"o": 27,
|
| 49 |
+
"p": 24,
|
| 50 |
+
"q": 12,
|
| 51 |
+
"r": 21,
|
| 52 |
+
"s": 8,
|
| 53 |
+
"t": 5,
|
| 54 |
+
"u": 28,
|
| 55 |
+
"v": 25,
|
| 56 |
+
"x": 14,
|
| 57 |
+
"y": 35,
|
| 58 |
+
"z": 22,
|
| 59 |
+
"á": 43,
|
| 60 |
+
"é": 37,
|
| 61 |
+
"í": 30,
|
| 62 |
+
"ñ": 42,
|
| 63 |
+
"ó": 34,
|
| 64 |
+
"ú": 20,
|
| 65 |
+
"̱": 29,
|
| 66 |
+
"—": 41,
|
| 67 |
+
"ꞌ": 16
|
| 68 |
+
},
|
| 69 |
+
"pad": null,
|
| 70 |
+
"blank": "7",
|
| 71 |
+
"bos": null,
|
| 72 |
+
"eos": null,
|
| 73 |
+
"add_blank_char": true,
|
| 74 |
+
"add_blank_word": false,
|
| 75 |
+
"use_eos_bos": false,
|
| 76 |
+
"blank_at_start": true,
|
| 77 |
+
"blank_at_end": true,
|
| 78 |
+
"word_sep_token": " ",
|
| 79 |
+
"blank_between": "tokens_and_words"
|
| 80 |
+
}
|
facebook__mms-tts-pmf-Pamona/config.json
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pmf",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 26,
|
| 24 |
+
"'": 17,
|
| 25 |
+
"-": 22,
|
| 26 |
+
"a": 0,
|
| 27 |
+
"b": 18,
|
| 28 |
+
"c": 24,
|
| 29 |
+
"d": 19,
|
| 30 |
+
"e": 6,
|
| 31 |
+
"f": 25,
|
| 32 |
+
"g": 13,
|
| 33 |
+
"h": 21,
|
| 34 |
+
"i": 3,
|
| 35 |
+
"j": 20,
|
| 36 |
+
"k": 9,
|
| 37 |
+
"l": 14,
|
| 38 |
+
"m": 5,
|
| 39 |
+
"n": 4,
|
| 40 |
+
"o": 2,
|
| 41 |
+
"p": 11,
|
| 42 |
+
"r": 12,
|
| 43 |
+
"s": 10,
|
| 44 |
+
"t": 7,
|
| 45 |
+
"u": 8,
|
| 46 |
+
"w": 16,
|
| 47 |
+
"y": 15,
|
| 48 |
+
"z": 23,
|
| 49 |
+
"|": 1
|
| 50 |
+
},
|
| 51 |
+
"pad": null,
|
| 52 |
+
"blank": "a",
|
| 53 |
+
"bos": null,
|
| 54 |
+
"eos": null,
|
| 55 |
+
"add_blank_char": true,
|
| 56 |
+
"add_blank_word": false,
|
| 57 |
+
"use_eos_bos": false,
|
| 58 |
+
"blank_at_start": true,
|
| 59 |
+
"blank_at_end": true,
|
| 60 |
+
"word_sep_token": " ",
|
| 61 |
+
"blank_between": "tokens_and_words"
|
| 62 |
+
}
|
facebook__mms-tts-pny-Pinyin/config.json
ADDED
|
@@ -0,0 +1,90 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pny",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 54,
|
| 24 |
+
"'": 47,
|
| 25 |
+
"-": 51,
|
| 26 |
+
"1": 52,
|
| 27 |
+
"2": 53,
|
| 28 |
+
"a": 5,
|
| 29 |
+
"b": 16,
|
| 30 |
+
"c": 34,
|
| 31 |
+
"d": 29,
|
| 32 |
+
"e": 26,
|
| 33 |
+
"f": 32,
|
| 34 |
+
"g": 20,
|
| 35 |
+
"h": 12,
|
| 36 |
+
"i": 23,
|
| 37 |
+
"j": 38,
|
| 38 |
+
"k": 21,
|
| 39 |
+
"l": 11,
|
| 40 |
+
"m": 6,
|
| 41 |
+
"n": 3,
|
| 42 |
+
"o": 13,
|
| 43 |
+
"p": 7,
|
| 44 |
+
"q": 50,
|
| 45 |
+
"r": 24,
|
| 46 |
+
"s": 17,
|
| 47 |
+
"t": 9,
|
| 48 |
+
"u": 15,
|
| 49 |
+
"v": 46,
|
| 50 |
+
"w": 10,
|
| 51 |
+
"x": 49,
|
| 52 |
+
"y": 22,
|
| 53 |
+
"z": 25,
|
| 54 |
+
"|": 0,
|
| 55 |
+
"à": 8,
|
| 56 |
+
"â": 35,
|
| 57 |
+
"è": 31,
|
| 58 |
+
"ì": 33,
|
| 59 |
+
"î": 44,
|
| 60 |
+
"ò": 27,
|
| 61 |
+
"ô": 36,
|
| 62 |
+
"ù": 18,
|
| 63 |
+
"û": 39,
|
| 64 |
+
"ě": 40,
|
| 65 |
+
"ŋ": 14,
|
| 66 |
+
"ǎ": 37,
|
| 67 |
+
"ǐ": 45,
|
| 68 |
+
"ǒ": 48,
|
| 69 |
+
"ǔ": 43,
|
| 70 |
+
"ǹ": 42,
|
| 71 |
+
"ə": 1,
|
| 72 |
+
"ɨ": 4,
|
| 73 |
+
"ʼ": 19,
|
| 74 |
+
"̀": 2,
|
| 75 |
+
"̂": 30,
|
| 76 |
+
"̌": 41,
|
| 77 |
+
"ẅ": 28
|
| 78 |
+
},
|
| 79 |
+
"pad": null,
|
| 80 |
+
"blank": "|",
|
| 81 |
+
"bos": null,
|
| 82 |
+
"eos": null,
|
| 83 |
+
"add_blank_char": true,
|
| 84 |
+
"add_blank_word": false,
|
| 85 |
+
"use_eos_bos": false,
|
| 86 |
+
"blank_at_start": true,
|
| 87 |
+
"blank_at_end": true,
|
| 88 |
+
"word_sep_token": " ",
|
| 89 |
+
"blank_between": "tokens_and_words"
|
| 90 |
+
}
|
facebook__mms-tts-poh-dialect_eastern-Poqomchi’/config.json
ADDED
|
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "poh-dialect-eastern",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 7,
|
| 24 |
+
"'": 17,
|
| 25 |
+
"-": 25,
|
| 26 |
+
"_": 9,
|
| 27 |
+
"a": 11,
|
| 28 |
+
"b": 14,
|
| 29 |
+
"c": 31,
|
| 30 |
+
"d": 32,
|
| 31 |
+
"e": 1,
|
| 32 |
+
"f": 16,
|
| 33 |
+
"g": 20,
|
| 34 |
+
"h": 0,
|
| 35 |
+
"i": 28,
|
| 36 |
+
"j": 26,
|
| 37 |
+
"k": 27,
|
| 38 |
+
"l": 10,
|
| 39 |
+
"m": 18,
|
| 40 |
+
"n": 36,
|
| 41 |
+
"o": 35,
|
| 42 |
+
"p": 2,
|
| 43 |
+
"q": 23,
|
| 44 |
+
"r": 12,
|
| 45 |
+
"s": 29,
|
| 46 |
+
"t": 34,
|
| 47 |
+
"u": 13,
|
| 48 |
+
"v": 19,
|
| 49 |
+
"w": 21,
|
| 50 |
+
"x": 33,
|
| 51 |
+
"y": 8,
|
| 52 |
+
"z": 24,
|
| 53 |
+
"á": 4,
|
| 54 |
+
"é": 22,
|
| 55 |
+
"í": 15,
|
| 56 |
+
"ñ": 30,
|
| 57 |
+
"ó": 3,
|
| 58 |
+
"ú": 5,
|
| 59 |
+
"—": 6
|
| 60 |
+
},
|
| 61 |
+
"pad": null,
|
| 62 |
+
"blank": "h",
|
| 63 |
+
"bos": null,
|
| 64 |
+
"eos": null,
|
| 65 |
+
"add_blank_char": true,
|
| 66 |
+
"add_blank_word": false,
|
| 67 |
+
"use_eos_bos": false,
|
| 68 |
+
"blank_at_start": true,
|
| 69 |
+
"blank_at_end": true,
|
| 70 |
+
"word_sep_token": " ",
|
| 71 |
+
"blank_between": "tokens_and_words"
|
| 72 |
+
}
|
facebook__mms-tts-poh-dialect_western-Poqomchi’/config.json
ADDED
|
@@ -0,0 +1,64 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "poh-dialect-western",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 28,
|
| 24 |
+
"-": 25,
|
| 25 |
+
"a": 2,
|
| 26 |
+
"b": 18,
|
| 27 |
+
"c": 4,
|
| 28 |
+
"d": 24,
|
| 29 |
+
"e": 6,
|
| 30 |
+
"h": 5,
|
| 31 |
+
"i": 1,
|
| 32 |
+
"j": 10,
|
| 33 |
+
"k": 11,
|
| 34 |
+
"l": 13,
|
| 35 |
+
"m": 17,
|
| 36 |
+
"n": 8,
|
| 37 |
+
"o": 9,
|
| 38 |
+
"p": 22,
|
| 39 |
+
"q": 21,
|
| 40 |
+
"r": 7,
|
| 41 |
+
"s": 20,
|
| 42 |
+
"t": 14,
|
| 43 |
+
"u": 12,
|
| 44 |
+
"w": 15,
|
| 45 |
+
"x": 19,
|
| 46 |
+
"y": 23,
|
| 47 |
+
"z": 26,
|
| 48 |
+
"|": 0,
|
| 49 |
+
"̱": 16,
|
| 50 |
+
"—": 27,
|
| 51 |
+
"ꞌ": 3
|
| 52 |
+
},
|
| 53 |
+
"pad": null,
|
| 54 |
+
"blank": "|",
|
| 55 |
+
"bos": null,
|
| 56 |
+
"eos": null,
|
| 57 |
+
"add_blank_char": true,
|
| 58 |
+
"add_blank_word": false,
|
| 59 |
+
"use_eos_bos": false,
|
| 60 |
+
"blank_at_start": true,
|
| 61 |
+
"blank_at_end": true,
|
| 62 |
+
"word_sep_token": " ",
|
| 63 |
+
"blank_between": "tokens_and_words"
|
| 64 |
+
}
|
facebook__mms-tts-poi-Popoluca_Highland/config.json
ADDED
|
@@ -0,0 +1,74 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "poi",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 15,
|
| 24 |
+
"-": 33,
|
| 25 |
+
"_": 10,
|
| 26 |
+
"a": 13,
|
| 27 |
+
"b": 11,
|
| 28 |
+
"c": 36,
|
| 29 |
+
"d": 18,
|
| 30 |
+
"e": 1,
|
| 31 |
+
"f": 9,
|
| 32 |
+
"g": 17,
|
| 33 |
+
"h": 37,
|
| 34 |
+
"i": 4,
|
| 35 |
+
"j": 31,
|
| 36 |
+
"k": 12,
|
| 37 |
+
"l": 27,
|
| 38 |
+
"m": 24,
|
| 39 |
+
"n": 29,
|
| 40 |
+
"o": 20,
|
| 41 |
+
"p": 23,
|
| 42 |
+
"q": 2,
|
| 43 |
+
"r": 3,
|
| 44 |
+
"s": 19,
|
| 45 |
+
"t": 34,
|
| 46 |
+
"u": 38,
|
| 47 |
+
"v": 16,
|
| 48 |
+
"w": 5,
|
| 49 |
+
"x": 6,
|
| 50 |
+
"y": 21,
|
| 51 |
+
"z": 32,
|
| 52 |
+
"á": 22,
|
| 53 |
+
"é": 8,
|
| 54 |
+
"í": 25,
|
| 55 |
+
"ñ": 0,
|
| 56 |
+
"ó": 28,
|
| 57 |
+
"ú": 30,
|
| 58 |
+
"ŋ": 26,
|
| 59 |
+
"ɨ": 35,
|
| 60 |
+
"́": 7,
|
| 61 |
+
"̱": 14
|
| 62 |
+
},
|
| 63 |
+
"pad": null,
|
| 64 |
+
"blank": "ñ",
|
| 65 |
+
"bos": null,
|
| 66 |
+
"eos": null,
|
| 67 |
+
"add_blank_char": true,
|
| 68 |
+
"add_blank_word": false,
|
| 69 |
+
"use_eos_bos": false,
|
| 70 |
+
"blank_at_start": true,
|
| 71 |
+
"blank_at_end": true,
|
| 72 |
+
"word_sep_token": " ",
|
| 73 |
+
"blank_between": "tokens_and_words"
|
| 74 |
+
}
|
facebook__mms-tts-pol-Polish/config.json
ADDED
|
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pl",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 2,
|
| 24 |
+
"-": 24,
|
| 25 |
+
"0": 4,
|
| 26 |
+
"1": 18,
|
| 27 |
+
"2": 12,
|
| 28 |
+
"3": 39,
|
| 29 |
+
"4": 15,
|
| 30 |
+
"5": 30,
|
| 31 |
+
"6": 23,
|
| 32 |
+
"7": 40,
|
| 33 |
+
"8": 27,
|
| 34 |
+
"9": 20,
|
| 35 |
+
"_": 31,
|
| 36 |
+
"a": 29,
|
| 37 |
+
"b": 26,
|
| 38 |
+
"c": 5,
|
| 39 |
+
"d": 11,
|
| 40 |
+
"e": 22,
|
| 41 |
+
"f": 17,
|
| 42 |
+
"g": 16,
|
| 43 |
+
"h": 1,
|
| 44 |
+
"i": 35,
|
| 45 |
+
"j": 37,
|
| 46 |
+
"k": 25,
|
| 47 |
+
"l": 3,
|
| 48 |
+
"m": 6,
|
| 49 |
+
"n": 41,
|
| 50 |
+
"o": 38,
|
| 51 |
+
"p": 19,
|
| 52 |
+
"r": 28,
|
| 53 |
+
"s": 8,
|
| 54 |
+
"t": 42,
|
| 55 |
+
"u": 10,
|
| 56 |
+
"w": 0,
|
| 57 |
+
"y": 33,
|
| 58 |
+
"z": 9,
|
| 59 |
+
"ó": 14,
|
| 60 |
+
"ą": 7,
|
| 61 |
+
"ć": 44,
|
| 62 |
+
"ę": 32,
|
| 63 |
+
"ł": 34,
|
| 64 |
+
"ń": 13,
|
| 65 |
+
"ś": 43,
|
| 66 |
+
"ź": 45,
|
| 67 |
+
"ż": 36,
|
| 68 |
+
"—": 21
|
| 69 |
+
},
|
| 70 |
+
"pad": null,
|
| 71 |
+
"blank": "w",
|
| 72 |
+
"bos": null,
|
| 73 |
+
"eos": null,
|
| 74 |
+
"add_blank_char": true,
|
| 75 |
+
"add_blank_word": false,
|
| 76 |
+
"use_eos_bos": false,
|
| 77 |
+
"blank_at_start": true,
|
| 78 |
+
"blank_at_end": true,
|
| 79 |
+
"word_sep_token": " ",
|
| 80 |
+
"blank_between": "tokens_and_words"
|
| 81 |
+
}
|
facebook__mms-tts-por-Portuguese/config.json
ADDED
|
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pt",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 32,
|
| 24 |
+
"'": 11,
|
| 25 |
+
"-": 19,
|
| 26 |
+
"1": 2,
|
| 27 |
+
"2": 5,
|
| 28 |
+
"4": 16,
|
| 29 |
+
"_": 13,
|
| 30 |
+
"a": 38,
|
| 31 |
+
"b": 31,
|
| 32 |
+
"c": 22,
|
| 33 |
+
"d": 40,
|
| 34 |
+
"e": 27,
|
| 35 |
+
"f": 30,
|
| 36 |
+
"g": 20,
|
| 37 |
+
"h": 6,
|
| 38 |
+
"i": 29,
|
| 39 |
+
"j": 39,
|
| 40 |
+
"l": 4,
|
| 41 |
+
"m": 18,
|
| 42 |
+
"n": 35,
|
| 43 |
+
"o": 28,
|
| 44 |
+
"p": 8,
|
| 45 |
+
"q": 21,
|
| 46 |
+
"r": 33,
|
| 47 |
+
"s": 14,
|
| 48 |
+
"t": 26,
|
| 49 |
+
"u": 3,
|
| 50 |
+
"v": 17,
|
| 51 |
+
"x": 10,
|
| 52 |
+
"z": 23,
|
| 53 |
+
"à": 0,
|
| 54 |
+
"á": 42,
|
| 55 |
+
"â": 24,
|
| 56 |
+
"ã": 9,
|
| 57 |
+
"ç": 15,
|
| 58 |
+
"é": 7,
|
| 59 |
+
"ê": 12,
|
| 60 |
+
"í": 25,
|
| 61 |
+
"ó": 37,
|
| 62 |
+
"ô": 34,
|
| 63 |
+
"õ": 41,
|
| 64 |
+
"ú": 1,
|
| 65 |
+
"—": 36
|
| 66 |
+
},
|
| 67 |
+
"pad": null,
|
| 68 |
+
"blank": "à",
|
| 69 |
+
"bos": null,
|
| 70 |
+
"eos": null,
|
| 71 |
+
"add_blank_char": true,
|
| 72 |
+
"add_blank_word": false,
|
| 73 |
+
"use_eos_bos": false,
|
| 74 |
+
"blank_at_start": true,
|
| 75 |
+
"blank_at_end": true,
|
| 76 |
+
"word_sep_token": " ",
|
| 77 |
+
"blank_between": "tokens_and_words"
|
| 78 |
+
}
|
facebook__mms-tts-poy-Pogolo/config.json
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "poy",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 14,
|
| 24 |
+
"'": 2,
|
| 25 |
+
"_": 12,
|
| 26 |
+
"a": 1,
|
| 27 |
+
"b": 20,
|
| 28 |
+
"c": 24,
|
| 29 |
+
"d": 26,
|
| 30 |
+
"e": 7,
|
| 31 |
+
"f": 13,
|
| 32 |
+
"g": 5,
|
| 33 |
+
"h": 22,
|
| 34 |
+
"i": 18,
|
| 35 |
+
"j": 19,
|
| 36 |
+
"k": 8,
|
| 37 |
+
"l": 16,
|
| 38 |
+
"m": 21,
|
| 39 |
+
"n": 6,
|
| 40 |
+
"o": 23,
|
| 41 |
+
"p": 4,
|
| 42 |
+
"r": 15,
|
| 43 |
+
"s": 11,
|
| 44 |
+
"t": 3,
|
| 45 |
+
"u": 0,
|
| 46 |
+
"v": 17,
|
| 47 |
+
"w": 25,
|
| 48 |
+
"y": 9,
|
| 49 |
+
"z": 10
|
| 50 |
+
},
|
| 51 |
+
"pad": null,
|
| 52 |
+
"blank": "u",
|
| 53 |
+
"bos": null,
|
| 54 |
+
"eos": null,
|
| 55 |
+
"add_blank_char": true,
|
| 56 |
+
"add_blank_word": false,
|
| 57 |
+
"use_eos_bos": false,
|
| 58 |
+
"blank_at_start": true,
|
| 59 |
+
"blank_at_end": true,
|
| 60 |
+
"word_sep_token": " ",
|
| 61 |
+
"blank_between": "tokens_and_words"
|
| 62 |
+
}
|
facebook__mms-tts-pps-Popoloca_San_Luís_Temalacayuca/config.json
ADDED
|
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pps",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 20,
|
| 24 |
+
"'": 1,
|
| 25 |
+
"-": 35,
|
| 26 |
+
"1": 4,
|
| 27 |
+
"2": 37,
|
| 28 |
+
"5": 40,
|
| 29 |
+
"9": 23,
|
| 30 |
+
"_": 6,
|
| 31 |
+
"`": 11,
|
| 32 |
+
"a": 41,
|
| 33 |
+
"b": 36,
|
| 34 |
+
"c": 26,
|
| 35 |
+
"d": 10,
|
| 36 |
+
"e": 22,
|
| 37 |
+
"f": 29,
|
| 38 |
+
"g": 13,
|
| 39 |
+
"h": 17,
|
| 40 |
+
"i": 14,
|
| 41 |
+
"j": 2,
|
| 42 |
+
"k": 28,
|
| 43 |
+
"l": 24,
|
| 44 |
+
"m": 12,
|
| 45 |
+
"n": 19,
|
| 46 |
+
"o": 0,
|
| 47 |
+
"p": 21,
|
| 48 |
+
"q": 30,
|
| 49 |
+
"r": 3,
|
| 50 |
+
"s": 32,
|
| 51 |
+
"t": 5,
|
| 52 |
+
"u": 18,
|
| 53 |
+
"v": 43,
|
| 54 |
+
"x": 7,
|
| 55 |
+
"y": 34,
|
| 56 |
+
"z": 33,
|
| 57 |
+
"à": 16,
|
| 58 |
+
"á": 42,
|
| 59 |
+
"é": 45,
|
| 60 |
+
"ì": 9,
|
| 61 |
+
"í": 39,
|
| 62 |
+
"ñ": 31,
|
| 63 |
+
"ó": 8,
|
| 64 |
+
"ù": 44,
|
| 65 |
+
"ú": 15,
|
| 66 |
+
"̱": 38,
|
| 67 |
+
"—": 25,
|
| 68 |
+
"ꞌ": 27
|
| 69 |
+
},
|
| 70 |
+
"pad": null,
|
| 71 |
+
"blank": "o",
|
| 72 |
+
"bos": null,
|
| 73 |
+
"eos": null,
|
| 74 |
+
"add_blank_char": true,
|
| 75 |
+
"add_blank_word": false,
|
| 76 |
+
"use_eos_bos": false,
|
| 77 |
+
"blank_at_start": true,
|
| 78 |
+
"blank_at_end": true,
|
| 79 |
+
"word_sep_token": " ",
|
| 80 |
+
"blank_between": "tokens_and_words"
|
| 81 |
+
}
|
facebook__mms-tts-prf-Paranan/config.json
ADDED
|
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "prf",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 35,
|
| 24 |
+
"'": 24,
|
| 25 |
+
"-": 22,
|
| 26 |
+
"0": 29,
|
| 27 |
+
"1": 30,
|
| 28 |
+
"2": 31,
|
| 29 |
+
"4": 33,
|
| 30 |
+
"6": 34,
|
| 31 |
+
"a": 1,
|
| 32 |
+
"b": 17,
|
| 33 |
+
"c": 23,
|
| 34 |
+
"d": 8,
|
| 35 |
+
"e": 6,
|
| 36 |
+
"f": 25,
|
| 37 |
+
"g": 11,
|
| 38 |
+
"h": 18,
|
| 39 |
+
"i": 3,
|
| 40 |
+
"j": 21,
|
| 41 |
+
"k": 5,
|
| 42 |
+
"l": 14,
|
| 43 |
+
"m": 10,
|
| 44 |
+
"n": 2,
|
| 45 |
+
"o": 15,
|
| 46 |
+
"p": 13,
|
| 47 |
+
"q": 28,
|
| 48 |
+
"r": 19,
|
| 49 |
+
"s": 12,
|
| 50 |
+
"t": 4,
|
| 51 |
+
"u": 7,
|
| 52 |
+
"v": 27,
|
| 53 |
+
"w": 20,
|
| 54 |
+
"x": 32,
|
| 55 |
+
"y": 9,
|
| 56 |
+
"z": 26,
|
| 57 |
+
"|": 0,
|
| 58 |
+
"á": 16
|
| 59 |
+
},
|
| 60 |
+
"pad": null,
|
| 61 |
+
"blank": "|",
|
| 62 |
+
"bos": null,
|
| 63 |
+
"eos": null,
|
| 64 |
+
"add_blank_char": true,
|
| 65 |
+
"add_blank_word": false,
|
| 66 |
+
"use_eos_bos": false,
|
| 67 |
+
"blank_at_start": true,
|
| 68 |
+
"blank_at_end": true,
|
| 69 |
+
"word_sep_token": " ",
|
| 70 |
+
"blank_between": "tokens_and_words"
|
| 71 |
+
}
|
facebook__mms-tts-prt-Prai/config.json
ADDED
|
@@ -0,0 +1,90 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "prt",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 38,
|
| 24 |
+
"'": 50,
|
| 25 |
+
"-": 48,
|
| 26 |
+
"0": 21,
|
| 27 |
+
"1": 0,
|
| 28 |
+
"2": 46,
|
| 29 |
+
"3": 25,
|
| 30 |
+
"4": 31,
|
| 31 |
+
"5": 26,
|
| 32 |
+
"6": 1,
|
| 33 |
+
"7": 47,
|
| 34 |
+
"8": 43,
|
| 35 |
+
"9": 30,
|
| 36 |
+
"_": 3,
|
| 37 |
+
"ก": 34,
|
| 38 |
+
"ค": 15,
|
| 39 |
+
"ง": 24,
|
| 40 |
+
"จ": 13,
|
| 41 |
+
"ซ": 53,
|
| 42 |
+
"ญ": 6,
|
| 43 |
+
"ด": 42,
|
| 44 |
+
"ต": 37,
|
| 45 |
+
"ท": 16,
|
| 46 |
+
"น": 12,
|
| 47 |
+
"บ": 18,
|
| 48 |
+
"ป": 9,
|
| 49 |
+
"พ": 10,
|
| 50 |
+
"ฟ": 14,
|
| 51 |
+
"ม": 54,
|
| 52 |
+
"ย": 29,
|
| 53 |
+
"ร": 5,
|
| 54 |
+
"ล": 51,
|
| 55 |
+
"ว": 20,
|
| 56 |
+
"ห": 36,
|
| 57 |
+
"อ": 7,
|
| 58 |
+
"ฮ": 35,
|
| 59 |
+
"ะ": 28,
|
| 60 |
+
"ั": 8,
|
| 61 |
+
"า": 32,
|
| 62 |
+
"ิ": 39,
|
| 63 |
+
"ี": 33,
|
| 64 |
+
"ึ": 44,
|
| 65 |
+
"ื": 11,
|
| 66 |
+
"ุ": 17,
|
| 67 |
+
"ู": 40,
|
| 68 |
+
"เ": 45,
|
| 69 |
+
"แ": 23,
|
| 70 |
+
"โ": 52,
|
| 71 |
+
"ใ": 22,
|
| 72 |
+
"ไ": 19,
|
| 73 |
+
"็": 41,
|
| 74 |
+
"้": 2,
|
| 75 |
+
"๊": 27,
|
| 76 |
+
"ํ": 49,
|
| 77 |
+
"": 4
|
| 78 |
+
},
|
| 79 |
+
"pad": null,
|
| 80 |
+
"blank": "1",
|
| 81 |
+
"bos": null,
|
| 82 |
+
"eos": null,
|
| 83 |
+
"add_blank_char": true,
|
| 84 |
+
"add_blank_word": false,
|
| 85 |
+
"use_eos_bos": false,
|
| 86 |
+
"blank_at_start": true,
|
| 87 |
+
"blank_at_end": true,
|
| 88 |
+
"word_sep_token": " ",
|
| 89 |
+
"blank_between": "tokens_and_words"
|
| 90 |
+
}
|
facebook__mms-tts-pui-Puinave/config.json
ADDED
|
@@ -0,0 +1,77 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "pui",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 33,
|
| 24 |
+
"-": 29,
|
| 25 |
+
"0": 1,
|
| 26 |
+
"2": 13,
|
| 27 |
+
"4": 30,
|
| 28 |
+
"7": 32,
|
| 29 |
+
"9": 39,
|
| 30 |
+
"_": 5,
|
| 31 |
+
"a": 11,
|
| 32 |
+
"b": 18,
|
| 33 |
+
"c": 37,
|
| 34 |
+
"d": 7,
|
| 35 |
+
"e": 31,
|
| 36 |
+
"f": 36,
|
| 37 |
+
"g": 38,
|
| 38 |
+
"h": 14,
|
| 39 |
+
"i": 34,
|
| 40 |
+
"j": 15,
|
| 41 |
+
"k": 12,
|
| 42 |
+
"l": 17,
|
| 43 |
+
"m": 4,
|
| 44 |
+
"n": 6,
|
| 45 |
+
"o": 26,
|
| 46 |
+
"p": 10,
|
| 47 |
+
"q": 28,
|
| 48 |
+
"r": 41,
|
| 49 |
+
"s": 40,
|
| 50 |
+
"t": 20,
|
| 51 |
+
"u": 35,
|
| 52 |
+
"v": 21,
|
| 53 |
+
"w": 27,
|
| 54 |
+
"x": 8,
|
| 55 |
+
"y": 16,
|
| 56 |
+
"z": 25,
|
| 57 |
+
"á": 3,
|
| 58 |
+
"é": 23,
|
| 59 |
+
"í": 0,
|
| 60 |
+
"ñ": 22,
|
| 61 |
+
"ó": 9,
|
| 62 |
+
"ú": 19,
|
| 63 |
+
"ü": 2,
|
| 64 |
+
"ŕ": 24
|
| 65 |
+
},
|
| 66 |
+
"pad": null,
|
| 67 |
+
"blank": "í",
|
| 68 |
+
"bos": null,
|
| 69 |
+
"eos": null,
|
| 70 |
+
"add_blank_char": true,
|
| 71 |
+
"add_blank_word": false,
|
| 72 |
+
"use_eos_bos": false,
|
| 73 |
+
"blank_at_start": true,
|
| 74 |
+
"blank_at_end": true,
|
| 75 |
+
"word_sep_token": " ",
|
| 76 |
+
"blank_between": "tokens_and_words"
|
| 77 |
+
}
|
facebook__mms-tts-qub-Quechua_Huallaga/config.json
ADDED
|
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qub",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 40,
|
| 24 |
+
"'": 37,
|
| 25 |
+
"-": 27,
|
| 26 |
+
"a": 0,
|
| 27 |
+
"b": 23,
|
| 28 |
+
"c": 3,
|
| 29 |
+
"d": 21,
|
| 30 |
+
"e": 19,
|
| 31 |
+
"f": 28,
|
| 32 |
+
"g": 15,
|
| 33 |
+
"h": 6,
|
| 34 |
+
"i": 4,
|
| 35 |
+
"j": 14,
|
| 36 |
+
"k": 39,
|
| 37 |
+
"l": 13,
|
| 38 |
+
"m": 10,
|
| 39 |
+
"n": 2,
|
| 40 |
+
"o": 16,
|
| 41 |
+
"p": 12,
|
| 42 |
+
"q": 20,
|
| 43 |
+
"r": 9,
|
| 44 |
+
"s": 8,
|
| 45 |
+
"t": 11,
|
| 46 |
+
"u": 5,
|
| 47 |
+
"v": 34,
|
| 48 |
+
"w": 17,
|
| 49 |
+
"x": 38,
|
| 50 |
+
"y": 7,
|
| 51 |
+
"z": 33,
|
| 52 |
+
"|": 1,
|
| 53 |
+
"á": 36,
|
| 54 |
+
"ä": 18,
|
| 55 |
+
"é": 32,
|
| 56 |
+
"ë": 26,
|
| 57 |
+
"í": 31,
|
| 58 |
+
"ï": 25,
|
| 59 |
+
"ñ": 24,
|
| 60 |
+
"ó": 35,
|
| 61 |
+
"ö": 22,
|
| 62 |
+
"ú": 29,
|
| 63 |
+
"ü": 30
|
| 64 |
+
},
|
| 65 |
+
"pad": null,
|
| 66 |
+
"blank": "a",
|
| 67 |
+
"bos": null,
|
| 68 |
+
"eos": null,
|
| 69 |
+
"add_blank_char": true,
|
| 70 |
+
"add_blank_word": false,
|
| 71 |
+
"use_eos_bos": false,
|
| 72 |
+
"blank_at_start": true,
|
| 73 |
+
"blank_at_end": true,
|
| 74 |
+
"word_sep_token": " ",
|
| 75 |
+
"blank_between": "tokens_and_words"
|
| 76 |
+
}
|
facebook__mms-tts-quf-Quechua_Lambayeque/config.json
ADDED
|
@@ -0,0 +1,70 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "quf",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 34,
|
| 24 |
+
"'": 18,
|
| 25 |
+
"-": 23,
|
| 26 |
+
"0": 29,
|
| 27 |
+
"1": 31,
|
| 28 |
+
"2": 32,
|
| 29 |
+
"4": 33,
|
| 30 |
+
"a": 0,
|
| 31 |
+
"b": 21,
|
| 32 |
+
"c": 15,
|
| 33 |
+
"d": 17,
|
| 34 |
+
"e": 19,
|
| 35 |
+
"f": 26,
|
| 36 |
+
"g": 22,
|
| 37 |
+
"h": 8,
|
| 38 |
+
"i": 3,
|
| 39 |
+
"j": 20,
|
| 40 |
+
"k": 5,
|
| 41 |
+
"l": 7,
|
| 42 |
+
"m": 10,
|
| 43 |
+
"n": 2,
|
| 44 |
+
"o": 24,
|
| 45 |
+
"p": 9,
|
| 46 |
+
"q": 12,
|
| 47 |
+
"r": 11,
|
| 48 |
+
"s": 13,
|
| 49 |
+
"t": 14,
|
| 50 |
+
"u": 4,
|
| 51 |
+
"v": 27,
|
| 52 |
+
"w": 16,
|
| 53 |
+
"x": 30,
|
| 54 |
+
"y": 6,
|
| 55 |
+
"z": 28,
|
| 56 |
+
"|": 1,
|
| 57 |
+
"ñ": 25
|
| 58 |
+
},
|
| 59 |
+
"pad": null,
|
| 60 |
+
"blank": "a",
|
| 61 |
+
"bos": null,
|
| 62 |
+
"eos": null,
|
| 63 |
+
"add_blank_char": true,
|
| 64 |
+
"add_blank_word": false,
|
| 65 |
+
"use_eos_bos": false,
|
| 66 |
+
"blank_at_start": true,
|
| 67 |
+
"blank_at_end": true,
|
| 68 |
+
"word_sep_token": " ",
|
| 69 |
+
"blank_between": "tokens_and_words"
|
| 70 |
+
}
|
facebook__mms-tts-quh-Quechua_South_Bolivian/config.json
ADDED
|
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "quh",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 11,
|
| 24 |
+
"'": 27,
|
| 25 |
+
"0": 22,
|
| 26 |
+
"1": 18,
|
| 27 |
+
"2": 10,
|
| 28 |
+
"3": 35,
|
| 29 |
+
"4": 20,
|
| 30 |
+
"5": 13,
|
| 31 |
+
"6": 19,
|
| 32 |
+
"7": 42,
|
| 33 |
+
"_": 33,
|
| 34 |
+
"a": 2,
|
| 35 |
+
"b": 32,
|
| 36 |
+
"c": 25,
|
| 37 |
+
"d": 12,
|
| 38 |
+
"e": 28,
|
| 39 |
+
"f": 23,
|
| 40 |
+
"g": 9,
|
| 41 |
+
"h": 5,
|
| 42 |
+
"i": 30,
|
| 43 |
+
"j": 34,
|
| 44 |
+
"k": 16,
|
| 45 |
+
"l": 4,
|
| 46 |
+
"m": 41,
|
| 47 |
+
"n": 24,
|
| 48 |
+
"o": 8,
|
| 49 |
+
"p": 7,
|
| 50 |
+
"q": 36,
|
| 51 |
+
"r": 38,
|
| 52 |
+
"s": 40,
|
| 53 |
+
"t": 6,
|
| 54 |
+
"u": 39,
|
| 55 |
+
"v": 26,
|
| 56 |
+
"w": 14,
|
| 57 |
+
"x": 31,
|
| 58 |
+
"y": 21,
|
| 59 |
+
"z": 0,
|
| 60 |
+
"á": 1,
|
| 61 |
+
"é": 17,
|
| 62 |
+
"í": 29,
|
| 63 |
+
"ñ": 3,
|
| 64 |
+
"ó": 37,
|
| 65 |
+
"ú": 15
|
| 66 |
+
},
|
| 67 |
+
"pad": null,
|
| 68 |
+
"blank": "z",
|
| 69 |
+
"bos": null,
|
| 70 |
+
"eos": null,
|
| 71 |
+
"add_blank_char": true,
|
| 72 |
+
"add_blank_word": false,
|
| 73 |
+
"use_eos_bos": false,
|
| 74 |
+
"blank_at_start": true,
|
| 75 |
+
"blank_at_end": true,
|
| 76 |
+
"word_sep_token": " ",
|
| 77 |
+
"blank_between": "tokens_and_words"
|
| 78 |
+
}
|
facebook__mms-tts-qul-Quechua_North_Bolivian/config.json
ADDED
|
@@ -0,0 +1,73 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qul",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 37,
|
| 24 |
+
"'": 18,
|
| 25 |
+
"a": 0,
|
| 26 |
+
"b": 24,
|
| 27 |
+
"c": 8,
|
| 28 |
+
"d": 21,
|
| 29 |
+
"e": 20,
|
| 30 |
+
"f": 26,
|
| 31 |
+
"g": 25,
|
| 32 |
+
"h": 7,
|
| 33 |
+
"i": 3,
|
| 34 |
+
"j": 17,
|
| 35 |
+
"k": 6,
|
| 36 |
+
"l": 15,
|
| 37 |
+
"m": 9,
|
| 38 |
+
"n": 2,
|
| 39 |
+
"o": 19,
|
| 40 |
+
"p": 12,
|
| 41 |
+
"q": 5,
|
| 42 |
+
"r": 14,
|
| 43 |
+
"s": 11,
|
| 44 |
+
"t": 13,
|
| 45 |
+
"u": 4,
|
| 46 |
+
"v": 29,
|
| 47 |
+
"w": 16,
|
| 48 |
+
"x": 36,
|
| 49 |
+
"y": 10,
|
| 50 |
+
"z": 32,
|
| 51 |
+
"|": 1,
|
| 52 |
+
"á": 34,
|
| 53 |
+
"ä": 31,
|
| 54 |
+
"é": 28,
|
| 55 |
+
"í": 27,
|
| 56 |
+
"ï": 35,
|
| 57 |
+
"ñ": 22,
|
| 58 |
+
"ó": 30,
|
| 59 |
+
"ú": 33,
|
| 60 |
+
"–": 23
|
| 61 |
+
},
|
| 62 |
+
"pad": null,
|
| 63 |
+
"blank": "a",
|
| 64 |
+
"bos": null,
|
| 65 |
+
"eos": null,
|
| 66 |
+
"add_blank_char": true,
|
| 67 |
+
"add_blank_word": false,
|
| 68 |
+
"use_eos_bos": false,
|
| 69 |
+
"blank_at_start": true,
|
| 70 |
+
"blank_at_end": true,
|
| 71 |
+
"word_sep_token": " ",
|
| 72 |
+
"blank_between": "tokens_and_words"
|
| 73 |
+
}
|
facebook__mms-tts-quw-Quichua_Tena_Lowland/config.json
ADDED
|
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "quw",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 43,
|
| 24 |
+
"'": 38,
|
| 25 |
+
"-": 40,
|
| 26 |
+
"0": 32,
|
| 27 |
+
"1": 33,
|
| 28 |
+
"2": 34,
|
| 29 |
+
"a": 0,
|
| 30 |
+
"b": 21,
|
| 31 |
+
"c": 5,
|
| 32 |
+
"d": 15,
|
| 33 |
+
"e": 19,
|
| 34 |
+
"f": 25,
|
| 35 |
+
"g": 13,
|
| 36 |
+
"h": 6,
|
| 37 |
+
"i": 2,
|
| 38 |
+
"j": 14,
|
| 39 |
+
"k": 39,
|
| 40 |
+
"l": 11,
|
| 41 |
+
"m": 9,
|
| 42 |
+
"n": 4,
|
| 43 |
+
"o": 18,
|
| 44 |
+
"p": 10,
|
| 45 |
+
"q": 20,
|
| 46 |
+
"r": 8,
|
| 47 |
+
"s": 7,
|
| 48 |
+
"t": 12,
|
| 49 |
+
"u": 3,
|
| 50 |
+
"v": 23,
|
| 51 |
+
"x": 35,
|
| 52 |
+
"y": 16,
|
| 53 |
+
"z": 22,
|
| 54 |
+
"|": 1,
|
| 55 |
+
"á": 30,
|
| 56 |
+
"ä": 41,
|
| 57 |
+
"é": 28,
|
| 58 |
+
"í": 26,
|
| 59 |
+
"ï": 36,
|
| 60 |
+
"ñ": 17,
|
| 61 |
+
"ó": 31,
|
| 62 |
+
"ú": 24,
|
| 63 |
+
"ü": 29,
|
| 64 |
+
"ź": 27,
|
| 65 |
+
"ḿ": 42,
|
| 66 |
+
"—": 37
|
| 67 |
+
},
|
| 68 |
+
"pad": null,
|
| 69 |
+
"blank": "a",
|
| 70 |
+
"bos": null,
|
| 71 |
+
"eos": null,
|
| 72 |
+
"add_blank_char": true,
|
| 73 |
+
"add_blank_word": false,
|
| 74 |
+
"use_eos_bos": false,
|
| 75 |
+
"blank_at_start": true,
|
| 76 |
+
"blank_at_end": true,
|
| 77 |
+
"word_sep_token": " ",
|
| 78 |
+
"blank_between": "tokens_and_words"
|
| 79 |
+
}
|
facebook__mms-tts-quy-Quechua_Ayacucho/config.json
ADDED
|
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "quy",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 29,
|
| 24 |
+
"-": 27,
|
| 25 |
+
"_": 1,
|
| 26 |
+
"a": 0,
|
| 27 |
+
"b": 25,
|
| 28 |
+
"c": 8,
|
| 29 |
+
"d": 12,
|
| 30 |
+
"e": 19,
|
| 31 |
+
"f": 5,
|
| 32 |
+
"g": 3,
|
| 33 |
+
"h": 33,
|
| 34 |
+
"i": 9,
|
| 35 |
+
"j": 11,
|
| 36 |
+
"k": 21,
|
| 37 |
+
"l": 24,
|
| 38 |
+
"m": 17,
|
| 39 |
+
"n": 23,
|
| 40 |
+
"o": 2,
|
| 41 |
+
"p": 22,
|
| 42 |
+
"q": 16,
|
| 43 |
+
"r": 13,
|
| 44 |
+
"s": 4,
|
| 45 |
+
"t": 31,
|
| 46 |
+
"u": 10,
|
| 47 |
+
"v": 20,
|
| 48 |
+
"w": 6,
|
| 49 |
+
"x": 26,
|
| 50 |
+
"y": 32,
|
| 51 |
+
"z": 7,
|
| 52 |
+
"á": 18,
|
| 53 |
+
"é": 30,
|
| 54 |
+
"í": 28,
|
| 55 |
+
"ñ": 15,
|
| 56 |
+
"ó": 14,
|
| 57 |
+
"ú": 35,
|
| 58 |
+
"—": 34
|
| 59 |
+
},
|
| 60 |
+
"pad": null,
|
| 61 |
+
"blank": "a",
|
| 62 |
+
"bos": null,
|
| 63 |
+
"eos": null,
|
| 64 |
+
"add_blank_char": true,
|
| 65 |
+
"add_blank_word": false,
|
| 66 |
+
"use_eos_bos": false,
|
| 67 |
+
"blank_at_start": true,
|
| 68 |
+
"blank_at_end": true,
|
| 69 |
+
"word_sep_token": " ",
|
| 70 |
+
"blank_between": "tokens_and_words"
|
| 71 |
+
}
|
facebook__mms-tts-quz-Quechua_Cusco/config.json
ADDED
|
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "quz",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 36,
|
| 24 |
+
"'": 20,
|
| 25 |
+
"-": 25,
|
| 26 |
+
"a": 0,
|
| 27 |
+
"b": 24,
|
| 28 |
+
"c": 11,
|
| 29 |
+
"d": 21,
|
| 30 |
+
"e": 18,
|
| 31 |
+
"f": 28,
|
| 32 |
+
"g": 23,
|
| 33 |
+
"h": 8,
|
| 34 |
+
"i": 3,
|
| 35 |
+
"j": 22,
|
| 36 |
+
"k": 6,
|
| 37 |
+
"l": 15,
|
| 38 |
+
"m": 13,
|
| 39 |
+
"n": 2,
|
| 40 |
+
"o": 16,
|
| 41 |
+
"p": 9,
|
| 42 |
+
"q": 5,
|
| 43 |
+
"r": 14,
|
| 44 |
+
"s": 7,
|
| 45 |
+
"t": 12,
|
| 46 |
+
"u": 4,
|
| 47 |
+
"v": 27,
|
| 48 |
+
"w": 17,
|
| 49 |
+
"x": 35,
|
| 50 |
+
"y": 10,
|
| 51 |
+
"z": 30,
|
| 52 |
+
"|": 1,
|
| 53 |
+
"á": 32,
|
| 54 |
+
"é": 31,
|
| 55 |
+
"í": 29,
|
| 56 |
+
"ñ": 19,
|
| 57 |
+
"ó": 33,
|
| 58 |
+
"ú": 34,
|
| 59 |
+
"–": 26
|
| 60 |
+
},
|
| 61 |
+
"pad": null,
|
| 62 |
+
"blank": "a",
|
| 63 |
+
"bos": null,
|
| 64 |
+
"eos": null,
|
| 65 |
+
"add_blank_char": true,
|
| 66 |
+
"add_blank_word": false,
|
| 67 |
+
"use_eos_bos": false,
|
| 68 |
+
"blank_at_start": true,
|
| 69 |
+
"blank_at_end": true,
|
| 70 |
+
"word_sep_token": " ",
|
| 71 |
+
"blank_between": "tokens_and_words"
|
| 72 |
+
}
|
facebook__mms-tts-qvc-Quechua_Cajamarca/config.json
ADDED
|
@@ -0,0 +1,77 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qvc",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 41,
|
| 24 |
+
"'": 35,
|
| 25 |
+
"0": 26,
|
| 26 |
+
"1": 33,
|
| 27 |
+
"2": 29,
|
| 28 |
+
"3": 36,
|
| 29 |
+
"4": 28,
|
| 30 |
+
"5": 34,
|
| 31 |
+
"6": 40,
|
| 32 |
+
"7": 39,
|
| 33 |
+
"8": 37,
|
| 34 |
+
"9": 38,
|
| 35 |
+
"a": 0,
|
| 36 |
+
"b": 18,
|
| 37 |
+
"c": 14,
|
| 38 |
+
"d": 16,
|
| 39 |
+
"e": 25,
|
| 40 |
+
"f": 24,
|
| 41 |
+
"g": 19,
|
| 42 |
+
"h": 5,
|
| 43 |
+
"i": 2,
|
| 44 |
+
"j": 20,
|
| 45 |
+
"k": 9,
|
| 46 |
+
"l": 12,
|
| 47 |
+
"m": 11,
|
| 48 |
+
"n": 3,
|
| 49 |
+
"o": 21,
|
| 50 |
+
"p": 10,
|
| 51 |
+
"q": 8,
|
| 52 |
+
"r": 13,
|
| 53 |
+
"s": 7,
|
| 54 |
+
"t": 15,
|
| 55 |
+
"u": 4,
|
| 56 |
+
"w": 17,
|
| 57 |
+
"y": 6,
|
| 58 |
+
"|": 1,
|
| 59 |
+
"á": 27,
|
| 60 |
+
"í": 32,
|
| 61 |
+
"ñ": 22,
|
| 62 |
+
"˻": 30,
|
| 63 |
+
"˼": 31,
|
| 64 |
+
"—": 23
|
| 65 |
+
},
|
| 66 |
+
"pad": null,
|
| 67 |
+
"blank": "a",
|
| 68 |
+
"bos": null,
|
| 69 |
+
"eos": null,
|
| 70 |
+
"add_blank_char": true,
|
| 71 |
+
"add_blank_word": false,
|
| 72 |
+
"use_eos_bos": false,
|
| 73 |
+
"blank_at_start": true,
|
| 74 |
+
"blank_at_end": true,
|
| 75 |
+
"word_sep_token": " ",
|
| 76 |
+
"blank_between": "tokens_and_words"
|
| 77 |
+
}
|
facebook__mms-tts-qve-Quechua_Eastern_Apurímac/config.json
ADDED
|
@@ -0,0 +1,75 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qve",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 39,
|
| 24 |
+
"'": 23,
|
| 25 |
+
"-": 33,
|
| 26 |
+
"0": 36,
|
| 27 |
+
"1": 37,
|
| 28 |
+
"2": 38,
|
| 29 |
+
"a": 0,
|
| 30 |
+
"b": 22,
|
| 31 |
+
"c": 10,
|
| 32 |
+
"d": 19,
|
| 33 |
+
"e": 17,
|
| 34 |
+
"f": 26,
|
| 35 |
+
"g": 24,
|
| 36 |
+
"h": 8,
|
| 37 |
+
"i": 3,
|
| 38 |
+
"j": 21,
|
| 39 |
+
"k": 6,
|
| 40 |
+
"l": 15,
|
| 41 |
+
"m": 14,
|
| 42 |
+
"n": 2,
|
| 43 |
+
"o": 16,
|
| 44 |
+
"p": 9,
|
| 45 |
+
"q": 7,
|
| 46 |
+
"r": 13,
|
| 47 |
+
"s": 5,
|
| 48 |
+
"t": 11,
|
| 49 |
+
"u": 4,
|
| 50 |
+
"v": 25,
|
| 51 |
+
"w": 18,
|
| 52 |
+
"x": 35,
|
| 53 |
+
"y": 12,
|
| 54 |
+
"z": 29,
|
| 55 |
+
"|": 1,
|
| 56 |
+
"á": 27,
|
| 57 |
+
"é": 32,
|
| 58 |
+
"í": 30,
|
| 59 |
+
"ñ": 20,
|
| 60 |
+
"ó": 31,
|
| 61 |
+
"ú": 34,
|
| 62 |
+
"—": 28
|
| 63 |
+
},
|
| 64 |
+
"pad": null,
|
| 65 |
+
"blank": "a",
|
| 66 |
+
"bos": null,
|
| 67 |
+
"eos": null,
|
| 68 |
+
"add_blank_char": true,
|
| 69 |
+
"add_blank_word": false,
|
| 70 |
+
"use_eos_bos": false,
|
| 71 |
+
"blank_at_start": true,
|
| 72 |
+
"blank_at_end": true,
|
| 73 |
+
"word_sep_token": " ",
|
| 74 |
+
"blank_between": "tokens_and_words"
|
| 75 |
+
}
|
facebook__mms-tts-qvh-Quechua_Huamalíes-Dos_de_Mayo_Huánuco/config.json
ADDED
|
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qvh",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 24,
|
| 24 |
+
"'": 39,
|
| 25 |
+
"-": 31,
|
| 26 |
+
"_": 17,
|
| 27 |
+
"a": 38,
|
| 28 |
+
"b": 27,
|
| 29 |
+
"c": 22,
|
| 30 |
+
"d": 11,
|
| 31 |
+
"e": 35,
|
| 32 |
+
"f": 1,
|
| 33 |
+
"g": 28,
|
| 34 |
+
"h": 2,
|
| 35 |
+
"i": 12,
|
| 36 |
+
"j": 29,
|
| 37 |
+
"k": 15,
|
| 38 |
+
"l": 16,
|
| 39 |
+
"m": 33,
|
| 40 |
+
"n": 21,
|
| 41 |
+
"o": 5,
|
| 42 |
+
"p": 34,
|
| 43 |
+
"q": 18,
|
| 44 |
+
"r": 10,
|
| 45 |
+
"s": 37,
|
| 46 |
+
"t": 13,
|
| 47 |
+
"u": 19,
|
| 48 |
+
"v": 23,
|
| 49 |
+
"w": 40,
|
| 50 |
+
"x": 6,
|
| 51 |
+
"y": 9,
|
| 52 |
+
"z": 4,
|
| 53 |
+
"á": 36,
|
| 54 |
+
"ä": 8,
|
| 55 |
+
"é": 25,
|
| 56 |
+
"ë": 0,
|
| 57 |
+
"í": 30,
|
| 58 |
+
"ï": 20,
|
| 59 |
+
"ñ": 7,
|
| 60 |
+
"ó": 26,
|
| 61 |
+
"ö": 14,
|
| 62 |
+
"ú": 32,
|
| 63 |
+
"ü": 3
|
| 64 |
+
},
|
| 65 |
+
"pad": null,
|
| 66 |
+
"blank": "ë",
|
| 67 |
+
"bos": null,
|
| 68 |
+
"eos": null,
|
| 69 |
+
"add_blank_char": true,
|
| 70 |
+
"add_blank_word": false,
|
| 71 |
+
"use_eos_bos": false,
|
| 72 |
+
"blank_at_start": true,
|
| 73 |
+
"blank_at_end": true,
|
| 74 |
+
"word_sep_token": " ",
|
| 75 |
+
"blank_between": "tokens_and_words"
|
| 76 |
+
}
|
facebook__mms-tts-qvm-Quechua_Margos-Yarowilca-Lauricocha/config.json
ADDED
|
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qvm",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 40,
|
| 24 |
+
"'": 38,
|
| 25 |
+
"-": 27,
|
| 26 |
+
"a": 0,
|
| 27 |
+
"b": 22,
|
| 28 |
+
"c": 4,
|
| 29 |
+
"d": 21,
|
| 30 |
+
"e": 16,
|
| 31 |
+
"f": 25,
|
| 32 |
+
"g": 8,
|
| 33 |
+
"h": 13,
|
| 34 |
+
"i": 3,
|
| 35 |
+
"j": 20,
|
| 36 |
+
"k": 39,
|
| 37 |
+
"l": 15,
|
| 38 |
+
"m": 12,
|
| 39 |
+
"n": 2,
|
| 40 |
+
"o": 14,
|
| 41 |
+
"p": 10,
|
| 42 |
+
"q": 19,
|
| 43 |
+
"r": 11,
|
| 44 |
+
"s": 6,
|
| 45 |
+
"t": 7,
|
| 46 |
+
"u": 5,
|
| 47 |
+
"v": 26,
|
| 48 |
+
"w": 18,
|
| 49 |
+
"x": 37,
|
| 50 |
+
"y": 9,
|
| 51 |
+
"z": 30,
|
| 52 |
+
"|": 1,
|
| 53 |
+
"á": 31,
|
| 54 |
+
"ä": 17,
|
| 55 |
+
"é": 33,
|
| 56 |
+
"ë": 24,
|
| 57 |
+
"í": 35,
|
| 58 |
+
"ï": 28,
|
| 59 |
+
"ñ": 34,
|
| 60 |
+
"ó": 36,
|
| 61 |
+
"ö": 23,
|
| 62 |
+
"ú": 29,
|
| 63 |
+
"ü": 32
|
| 64 |
+
},
|
| 65 |
+
"pad": null,
|
| 66 |
+
"blank": "a",
|
| 67 |
+
"bos": null,
|
| 68 |
+
"eos": null,
|
| 69 |
+
"add_blank_char": true,
|
| 70 |
+
"add_blank_word": false,
|
| 71 |
+
"use_eos_bos": false,
|
| 72 |
+
"blank_at_start": true,
|
| 73 |
+
"blank_at_end": true,
|
| 74 |
+
"word_sep_token": " ",
|
| 75 |
+
"blank_between": "tokens_and_words"
|
| 76 |
+
}
|
facebook__mms-tts-qvn-Quechua_North_Junín/config.json
ADDED
|
@@ -0,0 +1,77 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qvn",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 41,
|
| 24 |
+
"'": 35,
|
| 25 |
+
"-": 25,
|
| 26 |
+
"a": 0,
|
| 27 |
+
"b": 22,
|
| 28 |
+
"c": 3,
|
| 29 |
+
"d": 20,
|
| 30 |
+
"e": 19,
|
| 31 |
+
"f": 29,
|
| 32 |
+
"g": 9,
|
| 33 |
+
"h": 10,
|
| 34 |
+
"i": 5,
|
| 35 |
+
"j": 18,
|
| 36 |
+
"k": 40,
|
| 37 |
+
"l": 15,
|
| 38 |
+
"m": 8,
|
| 39 |
+
"n": 2,
|
| 40 |
+
"o": 16,
|
| 41 |
+
"p": 12,
|
| 42 |
+
"q": 21,
|
| 43 |
+
"r": 6,
|
| 44 |
+
"s": 11,
|
| 45 |
+
"t": 13,
|
| 46 |
+
"u": 4,
|
| 47 |
+
"v": 26,
|
| 48 |
+
"w": 17,
|
| 49 |
+
"x": 38,
|
| 50 |
+
"y": 7,
|
| 51 |
+
"z": 27,
|
| 52 |
+
"|": 1,
|
| 53 |
+
"á": 36,
|
| 54 |
+
"ä": 14,
|
| 55 |
+
"é": 32,
|
| 56 |
+
"ë": 28,
|
| 57 |
+
"í": 34,
|
| 58 |
+
"ï": 24,
|
| 59 |
+
"ñ": 30,
|
| 60 |
+
"ó": 37,
|
| 61 |
+
"ö": 31,
|
| 62 |
+
"ú": 33,
|
| 63 |
+
"ü": 23,
|
| 64 |
+
"—": 39
|
| 65 |
+
},
|
| 66 |
+
"pad": null,
|
| 67 |
+
"blank": "a",
|
| 68 |
+
"bos": null,
|
| 69 |
+
"eos": null,
|
| 70 |
+
"add_blank_char": true,
|
| 71 |
+
"add_blank_word": false,
|
| 72 |
+
"use_eos_bos": false,
|
| 73 |
+
"blank_at_start": true,
|
| 74 |
+
"blank_at_end": true,
|
| 75 |
+
"word_sep_token": " ",
|
| 76 |
+
"blank_between": "tokens_and_words"
|
| 77 |
+
}
|
facebook__mms-tts-qvo-Quichua_Napo/config.json
ADDED
|
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qvo",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 35,
|
| 24 |
+
"'": 27,
|
| 25 |
+
"-": 22,
|
| 26 |
+
"a": 0,
|
| 27 |
+
"b": 21,
|
| 28 |
+
"c": 1,
|
| 29 |
+
"d": 19,
|
| 30 |
+
"e": 18,
|
| 31 |
+
"f": 24,
|
| 32 |
+
"g": 23,
|
| 33 |
+
"h": 6,
|
| 34 |
+
"i": 3,
|
| 35 |
+
"j": 17,
|
| 36 |
+
"k": 32,
|
| 37 |
+
"l": 12,
|
| 38 |
+
"m": 11,
|
| 39 |
+
"n": 5,
|
| 40 |
+
"o": 15,
|
| 41 |
+
"p": 8,
|
| 42 |
+
"q": 14,
|
| 43 |
+
"r": 10,
|
| 44 |
+
"s": 7,
|
| 45 |
+
"t": 9,
|
| 46 |
+
"u": 4,
|
| 47 |
+
"v": 25,
|
| 48 |
+
"x": 29,
|
| 49 |
+
"y": 13,
|
| 50 |
+
"z": 26,
|
| 51 |
+
"|": 2,
|
| 52 |
+
"á": 31,
|
| 53 |
+
"é": 34,
|
| 54 |
+
"í": 30,
|
| 55 |
+
"ñ": 16,
|
| 56 |
+
"ó": 28,
|
| 57 |
+
"ú": 33,
|
| 58 |
+
"—": 20
|
| 59 |
+
},
|
| 60 |
+
"pad": null,
|
| 61 |
+
"blank": "a",
|
| 62 |
+
"bos": null,
|
| 63 |
+
"eos": null,
|
| 64 |
+
"add_blank_char": true,
|
| 65 |
+
"add_blank_word": false,
|
| 66 |
+
"use_eos_bos": false,
|
| 67 |
+
"blank_at_start": true,
|
| 68 |
+
"blank_at_end": true,
|
| 69 |
+
"word_sep_token": " ",
|
| 70 |
+
"blank_between": "tokens_and_words"
|
| 71 |
+
}
|
facebook__mms-tts-qvs-Quechua_San_Martín/config.json
ADDED
|
@@ -0,0 +1,66 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qvs",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 30,
|
| 24 |
+
"a": 0,
|
| 25 |
+
"b": 21,
|
| 26 |
+
"c": 11,
|
| 27 |
+
"d": 17,
|
| 28 |
+
"e": 16,
|
| 29 |
+
"f": 25,
|
| 30 |
+
"g": 22,
|
| 31 |
+
"h": 6,
|
| 32 |
+
"i": 4,
|
| 33 |
+
"j": 19,
|
| 34 |
+
"k": 3,
|
| 35 |
+
"l": 13,
|
| 36 |
+
"m": 14,
|
| 37 |
+
"n": 2,
|
| 38 |
+
"o": 18,
|
| 39 |
+
"p": 9,
|
| 40 |
+
"r": 12,
|
| 41 |
+
"s": 7,
|
| 42 |
+
"t": 8,
|
| 43 |
+
"u": 5,
|
| 44 |
+
"v": 23,
|
| 45 |
+
"w": 15,
|
| 46 |
+
"x": 28,
|
| 47 |
+
"y": 10,
|
| 48 |
+
"z": 29,
|
| 49 |
+
"|": 1,
|
| 50 |
+
"á": 27,
|
| 51 |
+
"í": 26,
|
| 52 |
+
"ñ": 20,
|
| 53 |
+
"—": 24
|
| 54 |
+
},
|
| 55 |
+
"pad": null,
|
| 56 |
+
"blank": "a",
|
| 57 |
+
"bos": null,
|
| 58 |
+
"eos": null,
|
| 59 |
+
"add_blank_char": true,
|
| 60 |
+
"add_blank_word": false,
|
| 61 |
+
"use_eos_bos": false,
|
| 62 |
+
"blank_at_start": true,
|
| 63 |
+
"blank_at_end": true,
|
| 64 |
+
"word_sep_token": " ",
|
| 65 |
+
"blank_between": "tokens_and_words"
|
| 66 |
+
}
|
facebook__mms-tts-qvw-Quechua_Huaylla_Wanca/config.json
ADDED
|
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qvw",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 45,
|
| 24 |
+
"'": 24,
|
| 25 |
+
"-": 28,
|
| 26 |
+
"a": 0,
|
| 27 |
+
"b": 29,
|
| 28 |
+
"c": 2,
|
| 29 |
+
"d": 22,
|
| 30 |
+
"e": 27,
|
| 31 |
+
"f": 31,
|
| 32 |
+
"g": 30,
|
| 33 |
+
"h": 8,
|
| 34 |
+
"i": 4,
|
| 35 |
+
"j": 20,
|
| 36 |
+
"k": 41,
|
| 37 |
+
"l": 6,
|
| 38 |
+
"m": 9,
|
| 39 |
+
"n": 3,
|
| 40 |
+
"o": 25,
|
| 41 |
+
"p": 10,
|
| 42 |
+
"q": 16,
|
| 43 |
+
"r": 18,
|
| 44 |
+
"s": 12,
|
| 45 |
+
"t": 11,
|
| 46 |
+
"u": 5,
|
| 47 |
+
"v": 34,
|
| 48 |
+
"w": 14,
|
| 49 |
+
"x": 40,
|
| 50 |
+
"y": 7,
|
| 51 |
+
"z": 35,
|
| 52 |
+
"|": 1,
|
| 53 |
+
"á": 26,
|
| 54 |
+
"ä": 13,
|
| 55 |
+
"é": 37,
|
| 56 |
+
"ë": 36,
|
| 57 |
+
"í": 33,
|
| 58 |
+
"ï": 23,
|
| 59 |
+
"ñ": 21,
|
| 60 |
+
"ó": 42,
|
| 61 |
+
"ö": 44,
|
| 62 |
+
"ú": 32,
|
| 63 |
+
"ü": 19,
|
| 64 |
+
"ć": 15,
|
| 65 |
+
"ś": 17,
|
| 66 |
+
"˻": 38,
|
| 67 |
+
"˼": 39,
|
| 68 |
+
"—": 43
|
| 69 |
+
},
|
| 70 |
+
"pad": null,
|
| 71 |
+
"blank": "a",
|
| 72 |
+
"bos": null,
|
| 73 |
+
"eos": null,
|
| 74 |
+
"add_blank_char": true,
|
| 75 |
+
"add_blank_word": false,
|
| 76 |
+
"use_eos_bos": false,
|
| 77 |
+
"blank_at_start": true,
|
| 78 |
+
"blank_at_end": true,
|
| 79 |
+
"word_sep_token": " ",
|
| 80 |
+
"blank_between": "tokens_and_words"
|
| 81 |
+
}
|
facebook__mms-tts-qvz-Quichua_Northern_Pastaza/config.json
ADDED
|
@@ -0,0 +1,70 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qvz",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 34,
|
| 24 |
+
"-": 26,
|
| 25 |
+
"a": 0,
|
| 26 |
+
"b": 18,
|
| 27 |
+
"c": 4,
|
| 28 |
+
"d": 15,
|
| 29 |
+
"e": 19,
|
| 30 |
+
"f": 25,
|
| 31 |
+
"g": 11,
|
| 32 |
+
"h": 6,
|
| 33 |
+
"i": 2,
|
| 34 |
+
"j": 21,
|
| 35 |
+
"k": 33,
|
| 36 |
+
"l": 12,
|
| 37 |
+
"m": 10,
|
| 38 |
+
"n": 5,
|
| 39 |
+
"o": 16,
|
| 40 |
+
"p": 13,
|
| 41 |
+
"q": 20,
|
| 42 |
+
"r": 9,
|
| 43 |
+
"s": 7,
|
| 44 |
+
"t": 8,
|
| 45 |
+
"u": 3,
|
| 46 |
+
"v": 24,
|
| 47 |
+
"x": 32,
|
| 48 |
+
"y": 14,
|
| 49 |
+
"z": 22,
|
| 50 |
+
"|": 1,
|
| 51 |
+
"á": 23,
|
| 52 |
+
"é": 31,
|
| 53 |
+
"í": 28,
|
| 54 |
+
"ñ": 17,
|
| 55 |
+
"ó": 29,
|
| 56 |
+
"ú": 30,
|
| 57 |
+
"ü": 27
|
| 58 |
+
},
|
| 59 |
+
"pad": null,
|
| 60 |
+
"blank": "a",
|
| 61 |
+
"bos": null,
|
| 62 |
+
"eos": null,
|
| 63 |
+
"add_blank_char": true,
|
| 64 |
+
"add_blank_word": false,
|
| 65 |
+
"use_eos_bos": false,
|
| 66 |
+
"blank_at_start": true,
|
| 67 |
+
"blank_at_end": true,
|
| 68 |
+
"word_sep_token": " ",
|
| 69 |
+
"blank_between": "tokens_and_words"
|
| 70 |
+
}
|
facebook__mms-tts-qwh-Quechua_Huaylas_Ancash/config.json
ADDED
|
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qwh",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 36,
|
| 24 |
+
"'": 35,
|
| 25 |
+
"a": 0,
|
| 26 |
+
"b": 21,
|
| 27 |
+
"c": 5,
|
| 28 |
+
"d": 19,
|
| 29 |
+
"e": 10,
|
| 30 |
+
"f": 26,
|
| 31 |
+
"g": 23,
|
| 32 |
+
"h": 16,
|
| 33 |
+
"i": 3,
|
| 34 |
+
"j": 20,
|
| 35 |
+
"l": 13,
|
| 36 |
+
"m": 11,
|
| 37 |
+
"n": 2,
|
| 38 |
+
"o": 14,
|
| 39 |
+
"p": 12,
|
| 40 |
+
"q": 6,
|
| 41 |
+
"r": 9,
|
| 42 |
+
"s": 7,
|
| 43 |
+
"t": 8,
|
| 44 |
+
"u": 4,
|
| 45 |
+
"v": 31,
|
| 46 |
+
"w": 17,
|
| 47 |
+
"x": 34,
|
| 48 |
+
"y": 15,
|
| 49 |
+
"z": 30,
|
| 50 |
+
"|": 1,
|
| 51 |
+
"ä": 18,
|
| 52 |
+
"ë": 22,
|
| 53 |
+
"ï": 24,
|
| 54 |
+
"ñ": 27,
|
| 55 |
+
"ö": 28,
|
| 56 |
+
"ü": 29,
|
| 57 |
+
"˻": 32,
|
| 58 |
+
"˼": 33,
|
| 59 |
+
"—": 25
|
| 60 |
+
},
|
| 61 |
+
"pad": null,
|
| 62 |
+
"blank": "a",
|
| 63 |
+
"bos": null,
|
| 64 |
+
"eos": null,
|
| 65 |
+
"add_blank_char": true,
|
| 66 |
+
"add_blank_word": false,
|
| 67 |
+
"use_eos_bos": false,
|
| 68 |
+
"blank_at_start": true,
|
| 69 |
+
"blank_at_end": true,
|
| 70 |
+
"word_sep_token": " ",
|
| 71 |
+
"blank_between": "tokens_and_words"
|
| 72 |
+
}
|
facebook__mms-tts-qxh-Quechua_Panao/config.json
ADDED
|
@@ -0,0 +1,77 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"phoonnx_version": "1.0",
|
| 3 |
+
"engine": "transformers",
|
| 4 |
+
"phoneme_type": "graphemes",
|
| 5 |
+
"alphabet": "unicode",
|
| 6 |
+
"lang_code": "qxh",
|
| 7 |
+
"audio": {
|
| 8 |
+
"sample_rate": 16000
|
| 9 |
+
},
|
| 10 |
+
"num_symbols": 256,
|
| 11 |
+
"num_speakers": 1,
|
| 12 |
+
"num_langs": 1,
|
| 13 |
+
"speaker_id_map": {},
|
| 14 |
+
"lang_id_map": {},
|
| 15 |
+
"phonemizer_model": null,
|
| 16 |
+
"add_diacritics": false,
|
| 17 |
+
"inference": {
|
| 18 |
+
"noise_scale": 0.667,
|
| 19 |
+
"length_scale": 1.0,
|
| 20 |
+
"noise_w": 0.8
|
| 21 |
+
},
|
| 22 |
+
"phoneme_id_map": {
|
| 23 |
+
" ": 41,
|
| 24 |
+
"-": 23,
|
| 25 |
+
"2": 39,
|
| 26 |
+
"a": 0,
|
| 27 |
+
"b": 29,
|
| 28 |
+
"c": 5,
|
| 29 |
+
"d": 20,
|
| 30 |
+
"e": 22,
|
| 31 |
+
"f": 32,
|
| 32 |
+
"g": 18,
|
| 33 |
+
"h": 6,
|
| 34 |
+
"i": 3,
|
| 35 |
+
"j": 14,
|
| 36 |
+
"k": 38,
|
| 37 |
+
"l": 13,
|
| 38 |
+
"m": 11,
|
| 39 |
+
"n": 2,
|
| 40 |
+
"o": 21,
|
| 41 |
+
"p": 9,
|
| 42 |
+
"q": 16,
|
| 43 |
+
"r": 8,
|
| 44 |
+
"s": 7,
|
| 45 |
+
"t": 10,
|
| 46 |
+
"u": 4,
|
| 47 |
+
"v": 36,
|
| 48 |
+
"w": 15,
|
| 49 |
+
"x": 37,
|
| 50 |
+
"y": 12,
|
| 51 |
+
"z": 35,
|
| 52 |
+
"|": 1,
|
| 53 |
+
"": 40,
|
| 54 |
+
"á": 34,
|
| 55 |
+
"ä": 17,
|
| 56 |
+
"ç": 26,
|
| 57 |
+
"é": 30,
|
| 58 |
+
"í": 31,
|
| 59 |
+
"ï": 28,
|
| 60 |
+
"ñ": 24,
|
| 61 |
+
"ó": 33,
|
| 62 |
+
"ú": 25,
|
| 63 |
+
"ü": 27,
|
| 64 |
+
"ć": 19
|
| 65 |
+
},
|
| 66 |
+
"pad": null,
|
| 67 |
+
"blank": "a",
|
| 68 |
+
"bos": null,
|
| 69 |
+
"eos": null,
|
| 70 |
+
"add_blank_char": true,
|
| 71 |
+
"add_blank_word": false,
|
| 72 |
+
"use_eos_bos": false,
|
| 73 |
+
"blank_at_start": true,
|
| 74 |
+
"blank_at_end": true,
|
| 75 |
+
"word_sep_token": " ",
|
| 76 |
+
"blank_between": "tokens_and_words"
|
| 77 |
+
}
|