{ "dataset": "moe-speech-50speakers", "audio": { "sample_rate": 22050, "quality": "medium" }, "espeak": { "voice": "ja" }, "language": { "code": "ja" }, "inference": { "noise_scale": 0.667, "length_scale": 1, "noise_w": 0.8 }, "phoneme_type": "openjtalk", "phoneme_map": {}, "phoneme_id_map": { "_": [ 0 ], "^": [ 1 ], "$": [ 2 ], "?": [ 3 ], "#": [ 4 ], "[": [ 5 ], "]": [ 6 ], "a": [ 7 ], "i": [ 8 ], "u": [ 9 ], "e": [ 10 ], "o": [ 11 ], "A": [ 12 ], "I": [ 13 ], "U": [ 14 ], "E": [ 15 ], "O": [ 16 ], "\uE000": [ 17 ], "\uE001": [ 18 ], "\uE002": [ 19 ], "\uE003": [ 20 ], "\uE004": [ 21 ], "N": [ 22 ], "\uE005": [ 23 ], "q": [ 24 ], "k": [ 25 ], "\uE006": [ 26 ], "\uE007": [ 27 ], "g": [ 28 ], "\uE008": [ 29 ], "\uE009": [ 30 ], "t": [ 31 ], "\uE00A": [ 32 ], "d": [ 33 ], "\uE00B": [ 34 ], "p": [ 35 ], "\uE00C": [ 36 ], "b": [ 37 ], "\uE00D": [ 38 ], "\uE00E": [ 39 ], "\uE00F": [ 40 ], "s": [ 41 ], "\uE010": [ 42 ], "z": [ 43 ], "j": [ 44 ], "\uE011": [ 45 ], "f": [ 46 ], "h": [ 47 ], "\uE012": [ 48 ], "v": [ 49 ], "n": [ 50 ], "\uE013": [ 51 ], "m": [ 52 ], "\uE014": [ 53 ], "r": [ 54 ], "\uE015": [ 55 ], "w": [ 56 ], "y": [ 57 ] }, "num_symbols": 58, "num_speakers": 0, "piper_version": "1.4.0", "prosody_num_symbols": 11, "prosody_id_map": { "0": [ 0 ], "1": [ 1 ], "2": [ 2 ], "3": [ 3 ], "4": [ 4 ], "5": [ 5 ], "6": [ 6 ], "7": [ 7 ], "8": [ 8 ], "9": [ 9 ], "10": [ 10 ] } }