{
  "dataset": "moe-speech-20speakers-wavlm",
  "audio": {
    "sample_rate": 22050,
    "quality": "medium"
  },
  "espeak": {
    "voice": "ja"
  },
  "language": {
    "code": "ja"
  },
  "inference": {
    "noise_scale": 0.667,
    "length_scale": 1,
    "noise_w": 0.8
  },
  "phoneme_type": "openjtalk",
  "phoneme_map": {},
  "phoneme_id_map": {
    "_": [0],
    "^": [1],
    "$": [2],
    "?": [3],
    "\ue016": [4],
    "\ue017": [5],
    "\ue018": [6],
    "#": [7],
    "[": [8],
    "]": [9],
    "a": [10],
    "i": [11],
    "u": [12],
    "e": [13],
    "o": [14],
    "A": [15],
    "I": [16],
    "U": [17],
    "E": [18],
    "O": [19],
    "\u00e7": [20],
    "\u0255": [21],
    "\u026f": [22],
    "\u0274": [23],
    "\u027e": [24],
    "N": [25],
    "\ue019": [26],
    "\ue01a": [27],
    "\ue01b": [28],
    "\ue01c": [29],
    "\u0291": [30],
    "q": [31],
    "k": [32],
    "k\u02b2": [33],
    "\u0261\u02b2": [34],
    "g": [35],
    "\u0261": [36],
    "d\u0291": [37],
    "t": [38],
    "t\u0255": [39],
    "d": [40],
    "d\u02b2": [41],
    "p": [42],
    "p\u02b2": [43],
    "b": [44],
    "b\u02b2": [45],
    "c\u00e7": [46],
    "\u00e7\u02d0": [47],
    "s": [48],
    "\u0283": [49],
    "z": [50],
    "j": [51],
    "\u0272": [52],
    "f": [53],
    "h": [54],
    "h\u02b2": [55],
    "v": [56],
    "n": [57],
    "n\u02b2": [58],
    "m": [59],
    "m\u02b2": [60],
    "r": [61],
    "\u027d": [62],
    "w": [63],
    "y": [64]
  },
  "num_symbols": 65,
  "num_speakers": 0,
  "piper_version": "1.5.4",
  "prosody_dim": 16,
  "prosody_features": {
    "a1": "アクセント核からの相対位置",
    "a2": "アクセント句内のモーラ位置",
    "a3": "アクセント句内の総モーラ数"
  },
  "prosody_num_symbols": 11,
  "prosody_id_map": {
    "0": [0],
    "1": [1],
    "2": [2],
    "3": [3],
    "4": [4],
    "5": [5],
    "6": [6],
    "7": [7],
    "8": [8],
    "9": [9],
    "10": [10]
  },
  "use_wavlm_discriminator": true
}