{
"dataset": "moe-speech-20speakers-wavlm",
"audio": {
"sample_rate": 22050,
"quality": "medium"
},
"espeak": {
"voice": "ja"
},
"language": {
"code": "ja"
},
"inference": {
"noise_scale": 0.667,
"length_scale": 1,
"noise_w": 0.8
},
"phoneme_type": "openjtalk",
"phoneme_map": {},
"phoneme_id_map": {
"_": [0], "^": [1], "$": [2], "?": [3],
"\ue016": [4], "\ue017": [5], "\ue018": [6],
"#": [7], "[": [8], "]": [9],
"a": [10], "i": [11], "u": [12], "e": [13], "o": [14],
"A": [15], "I": [16], "U": [17], "E": [18], "O": [19],
"\u00e7": [20], "\u0255": [21], "\u026f": [22], "\u0274": [23], "\u027e": [24],
"N": [25],
"\ue019": [26], "\ue01a": [27], "\ue01b": [28], "\ue01c": [29],
"\u0291": [30], "q": [31], "k": [32],
"k\u02b2": [33], "\u0261\u02b2": [34], "g": [35], "\u0261": [36], "d\u0291": [37],
"t": [38], "t\u0255": [39], "d": [40], "d\u02b2": [41],
"p": [42], "p\u02b2": [43], "b": [44], "b\u02b2": [45],
"c\u00e7": [46], "\u00e7\u02d0": [47], "s": [48], "\u0283": [49],
"z": [50], "j": [51], "\u0272": [52],
"f": [53], "h": [54], "h\u02b2": [55], "v": [56],
"n": [57], "n\u02b2": [58], "m": [59], "m\u02b2": [60],
"r": [61], "\u027d": [62], "w": [63], "y": [64]
},
"num_symbols": 65,
"num_speakers": 0,
"piper_version": "1.5.4",
"prosody_dim": 16,
"prosody_features": {
"a1": "アクセント核からの相対位置",
"a2": "アクセント句内のモーラ位置",
"a3": "アクセント句内の総モーラ数"
},
"prosody_num_symbols": 11,
"prosody_id_map": {
"0": [0], "1": [1], "2": [2], "3": [3], "4": [4],
"5": [5], "6": [6], "7": [7], "8": [8], "9": [9], "10": [10]
},
"use_wavlm_discriminator": true
}