{ "dataset": "working", "audio": { "sample_rate": 22050, "quality": "training" }, "lang_code": "ca", "inference": { "noise_scale": 0.667, "length_scale": 1, "noise_w": 0.8, "add_diacritics": false }, "alphabet": "ipa", "phoneme_type": "espeak", "phonemizer_model": "", "phoneme_id_map": { "_": 0, "^": 1, "$": 2, " ": 3, "!": 4, "\"": 5, "#": 6, "'": 7, "(": 8, ")": 9, ",": 10, "-": 11, ".": 12, "0": 13, "1": 14, "2": 15, "3": 16, "4": 17, "5": 18, "6": 19, "7": 20, "8": 21, "9": 22, ":": 23, ";": 24, "?": 25, "X": 26, "a": 27, "b": 28, "c": 29, "d": 30, "e": 31, "f": 32, "g": 33, "h": 34, "i": 35, "j": 36, "k": 37, "l": 38, "m": 39, "n": 40, "o": 41, "p": 42, "q": 43, "r": 44, "s": 45, "t": 46, "u": 47, "v": 48, "w": 49, "x": 50, "y": 51, "z": 52, "æ": 53, "ç": 54, "ð": 55, "ø": 56, "ħ": 57, "ŋ": 58, "œ": 59, "ǀ": 60, "ǁ": 61, "ǂ": 62, "ǃ": 63, "ɐ": 64, "ɑ": 65, "ɒ": 66, "ɓ": 67, "ɔ": 68, "ɕ": 69, "ɖ": 70, "ɗ": 71, "ɘ": 72, "ə": 73, "ɚ": 74, "ɛ": 75, "ɜ": 76, "ɝ": 77, "ɞ": 78, "ɟ": 79, "ɠ": 80, "ɡ": 81, "ɢ": 82, "ɣ": 83, "ɤ": 84, "ɥ": 85, "ɦ": 86, "ɧ": 87, "ɨ": 88, "ɪ": 89, "ɫ": 90, "ɬ": 91, "ɭ": 92, "ɮ": 93, "ɯ": 94, "ɰ": 95, "ɱ": 96, "ɲ": 97, "ɳ": 98, "ɴ": 99, "ɵ": 100, "ɶ": 101, "ɸ": 102, "ɹ": 103, "ɺ": 104, "ɻ": 105, "ɽ": 106, "ɾ": 107, "ʀ": 108, "ʁ": 109, "ʂ": 110, "ʃ": 111, "ʄ": 112, "ʈ": 113, "ʉ": 114, "ʊ": 115, "ʋ": 116, "ʌ": 117, "ʍ": 118, "ʎ": 119, "ʏ": 120, "ʐ": 121, "ʑ": 122, "ʒ": 123, "ʔ": 124, "ʕ": 125, "ʘ": 126, "ʙ": 127, "ʛ": 128, "ʜ": 129, "ʝ": 130, "ʟ": 131, "ʡ": 132, "ʢ": 133, "ʦ": 134, "ʰ": 135, "ʲ": 136, "ʷ": 137, "ˈ": 138, "ˌ": 139, "ː": 140, "ˑ": 141, "˞": 142, "ˤ": 143, "̃": 144, "̊": 145, "̝": 146, "̧": 147, "̩": 148, "̪": 149, "̯": 150, "̺": 151, "̻": 152, "β": 153, "ε": 154, "θ": 155, "χ": 156, "ᵻ": 157, "↑": 158, "↓": 159, "ⱱ": 160 }, "num_symbols": 161, "num_speakers": 1, "speaker_id_map": {}, "phoonnx_version": "1.3.1a1" }