{ "dataset": "multilingual-6lang", "audio": { "sample_rate": 22050, "quality": "medium" }, "language": { "code": "ja-en-zh-es-fr-pt" }, "inference": { "noise_scale": 0.667, "length_scale": 1, "noise_w": 0.8 }, "phoneme_type": "multilingual", "phoneme_map": {}, "phoneme_id_map": { "_": [ 0 ], "^": [ 1 ], "$": [ 2 ], "?": [ 3 ], "": [ 4 ], "": [ 5 ], "": [ 6 ], "#": [ 7 ], "[": [ 8 ], "]": [ 9 ], "a": [ 10 ], "i": [ 11 ], "u": [ 12 ], "e": [ 13 ], "o": [ 14 ], "A": [ 15 ], "I": [ 16 ], "U": [ 17 ], "E": [ 18 ], "O": [ 19 ], "": [ 20 ], "": [ 21 ], "": [ 22 ], "": [ 23 ], "": [ 24 ], "N": [ 25 ], "": [ 26 ], "": [ 27 ], "": [ 28 ], "": [ 29 ], "": [ 30 ], "q": [ 31 ], "k": [ 32 ], "": [ 33 ], "": [ 34 ], "g": [ 35 ], "": [ 36 ], "": [ 37 ], "t": [ 38 ], "": [ 39 ], "d": [ 40 ], "": [ 41 ], "p": [ 42 ], "": [ 43 ], "b": [ 44 ], "": [ 45 ], "": [ 46 ], "": [ 47 ], "s": [ 48 ], "": [ 49 ], "z": [ 50 ], "j": [ 51 ], "": [ 52 ], "f": [ 53 ], "h": [ 54 ], "": [ 55 ], "v": [ 56 ], "n": [ 57 ], "": [ 58 ], "m": [ 59 ], "": [ 60 ], "r": [ 61 ], "": [ 62 ], "w": [ 63 ], "y": [ 64 ], "ɪ": [ 65 ], "ʊ": [ 66 ], "ɛ": [ 67 ], "ɔ": [ 68 ], "æ": [ 69 ], "ɑ": [ 70 ], "ʌ": [ 71 ], "ə": [ 72 ], "ɜ": [ 73 ], "ɹ": [ 74 ], "ɝ": [ 75 ], "ɫ": [ 76 ], "ð": [ 77 ], "θ": [ 78 ], "ŋ": [ 79 ], "ʃ": [ 80 ], "ʒ": [ 81 ], "": [ 82 ], "": [ 83 ], "l": [ 84 ], "ɡ": [ 85 ], "x": [ 86 ], "ˈ": [ 87 ], "ˌ": [ 88 ], "ː": [ 89 ], "": [ 90 ], "": [ 91 ], "": [ 92 ], "": [ 93 ], "ɔɪ": [ 94 ], "": [ 95 ], "": [ 96 ], "": [ 97 ], "": [ 98 ], "": [ 99 ], "": [ 100 ], "": [ 101 ], "": [ 102 ], "": [ 103 ], "": [ 104 ], "": [ 105 ], "": [ 106 ], "": [ 107 ], "": [ 108 ], "": [ 109 ], "": [ 110 ], "": [ 111 ], "": [ 112 ], "": [ 113 ], "": [ 114 ], "": [ 115 ], "": [ 116 ], "": [ 117 ], "": [ 118 ], "": [ 119 ], "": [ 120 ], "": [ 121 ], "": [ 122 ], "": [ 123 ], "": [ 124 ], "": [ 125 ], "ɕ": [ 126 ], "ɚ": [ 127 ], "ɤ": [ 128 ], "ɨ": [ 129 ], "ɻ": [ 130 ], "ʂ": [ 131 ], "": [ 132 ], "": [ 133 ], "": [ 134 ], "": [ 135 ], "": [ 136 ], "": [ 137 ], "": [ 138 ], "": [ 139 ], "": [ 140 ], "ɲ": [ 141 ], "ʎ": [ 142 ], "β": [ 143 ], "ɣ": [ 144 ], "ʁ": [ 145 ], "": [ 146 ], "": [ 147 ], "": [ 148 ], "œ̃": [ 149 ], "ø": [ 150 ], "œ": [ 151 ], "ɐ": [ 152 ], "ɐ̃": [ 153 ], "ẽ": [ 154 ], "ĩ": [ 155 ], "õ": [ 156 ], "ũ": [ 157 ], "": [ 158 ], "": [ 159 ], "": [ 160 ], "": [ 161 ], "": [ 162 ], "": [ 163 ], "": [ 164 ], "": [ 165 ], "ɯ": [ 166 ], "ɾ": [ 167 ], "ɰ": [ 168 ], "ɖ": [ 169 ], "ʈ": [ 170 ], "ɳ": [ 171 ], "ɭ": [ 172 ] }, "num_symbols": 173, "num_speakers": 0, "num_languages": 6, "language_id_map": { "ja": 0, "en": 1, "zh": 2, "es": 3, "fr": 4, "pt": 5 }, "prosody_num_symbols": 11, "prosody_id_map": { "0": [ 0 ], "1": [ 1 ], "2": [ 2 ], "3": [ 3 ], "4": [ 4 ], "5": [ 5 ], "6": [ 6 ], "7": [ 7 ], "8": [ 8 ], "9": [ 9 ], "10": [ 10 ] } }