|
{ |
|
"istftnet": { |
|
"upsample_kernel_sizes": [20, 12], |
|
"upsample_rates": [10, 6], |
|
"gen_istft_hop_size": 5, |
|
"gen_istft_n_fft": 20, |
|
"resblock_dilation_sizes": [ |
|
[1, 3, 5], |
|
[1, 3, 5], |
|
[1, 3, 5] |
|
], |
|
"resblock_kernel_sizes": [3, 7, 11], |
|
"upsample_initial_channel": 512 |
|
}, |
|
"dim_in": 64, |
|
"dropout": 0.2, |
|
"hidden_dim": 512, |
|
"max_conv_dim": 512, |
|
"max_dur": 50, |
|
"multispeaker": true, |
|
"n_layer": 3, |
|
"n_mels": 80, |
|
"n_token": 178, |
|
"style_dim": 128, |
|
"text_encoder_kernel_size": 5, |
|
"plbert": { |
|
"hidden_size": 768, |
|
"num_attention_heads": 12, |
|
"intermediate_size": 2048, |
|
"max_position_embeddings": 512, |
|
"num_hidden_layers": 12, |
|
"dropout": 0.1 |
|
}, |
|
"vocab": { |
|
";": 1, |
|
":": 2, |
|
",": 3, |
|
".": 4, |
|
"!": 5, |
|
"?": 6, |
|
"/": 7, |
|
"—": 9, |
|
"…": 10, |
|
"\"": 11, |
|
"(": 12, |
|
")": 13, |
|
"“": 14, |
|
"”": 15, |
|
" ": 16, |
|
"\u0303": 17, |
|
"ʣ": 18, |
|
"ʥ": 19, |
|
"ʦ": 20, |
|
"ʨ": 21, |
|
"ᵝ": 22, |
|
"ㄓ": 23, |
|
"A": 24, |
|
"I": 25, |
|
"ㄅ": 30, |
|
"O": 31, |
|
"ㄆ": 32, |
|
"Q": 33, |
|
"R": 34, |
|
"S": 35, |
|
"T": 36, |
|
"ㄇ": 37, |
|
"ㄈ": 38, |
|
"W": 39, |
|
"ㄉ": 40, |
|
"Y": 41, |
|
"ᵊ": 42, |
|
"a": 43, |
|
"b": 44, |
|
"c": 45, |
|
"d": 46, |
|
"e": 47, |
|
"f": 48, |
|
"ㄊ": 49, |
|
"h": 50, |
|
"i": 51, |
|
"j": 52, |
|
"k": 53, |
|
"l": 54, |
|
"m": 55, |
|
"n": 56, |
|
"o": 57, |
|
"p": 58, |
|
"q": 59, |
|
"r": 60, |
|
"s": 61, |
|
"t": 62, |
|
"u": 63, |
|
"v": 64, |
|
"w": 65, |
|
"x": 66, |
|
"y": 67, |
|
"z": 68, |
|
"ɑ": 69, |
|
"ɐ": 70, |
|
"ɒ": 71, |
|
"æ": 72, |
|
"ㄋ": 73, |
|
"ㄌ": 74, |
|
"β": 75, |
|
"ɔ": 76, |
|
"ɕ": 77, |
|
"ç": 78, |
|
"ㄍ": 79, |
|
"ɖ": 80, |
|
"ð": 81, |
|
"ʤ": 82, |
|
"ə": 83, |
|
"ㄎ": 84, |
|
"ㄦ": 85, |
|
"ɛ": 86, |
|
"ɜ": 87, |
|
"ㄏ": 88, |
|
"ㄐ": 89, |
|
"ɟ": 90, |
|
"ㄑ": 91, |
|
"ɡ": 92, |
|
"ㄒ": 93, |
|
"ㄔ": 94, |
|
"ㄕ": 95, |
|
"ㄗ": 96, |
|
"ㄘ": 97, |
|
"ㄙ": 98, |
|
"月": 99, |
|
"ㄚ": 100, |
|
"ɨ": 101, |
|
"ɪ": 102, |
|
"ʝ": 103, |
|
"ㄛ": 104, |
|
"ㄝ": 105, |
|
"ㄞ": 106, |
|
"ㄟ": 107, |
|
"ㄠ": 108, |
|
"ㄡ": 109, |
|
"ɯ": 110, |
|
"ɰ": 111, |
|
"ŋ": 112, |
|
"ɳ": 113, |
|
"ɲ": 114, |
|
"ɴ": 115, |
|
"ø": 116, |
|
"ㄢ": 117, |
|
"ɸ": 118, |
|
"θ": 119, |
|
"œ": 120, |
|
"ㄣ": 121, |
|
"ㄤ": 122, |
|
"ɹ": 123, |
|
"ㄥ": 124, |
|
"ɾ": 125, |
|
"ㄖ": 126, |
|
"ㄧ": 127, |
|
"ʁ": 128, |
|
"ɽ": 129, |
|
"ʂ": 130, |
|
"ʃ": 131, |
|
"ʈ": 132, |
|
"ʧ": 133, |
|
"ㄨ": 134, |
|
"ʊ": 135, |
|
"ʋ": 136, |
|
"ㄩ": 137, |
|
"ʌ": 138, |
|
"ɣ": 139, |
|
"ㄜ": 140, |
|
"ㄭ": 141, |
|
"χ": 142, |
|
"ʎ": 143, |
|
"十": 144, |
|
"压": 145, |
|
"言": 146, |
|
"ʒ": 147, |
|
"ʔ": 148, |
|
"阳": 149, |
|
"要": 150, |
|
"阴": 151, |
|
"应": 152, |
|
"用": 153, |
|
"又": 154, |
|
"中": 155, |
|
"ˈ": 156, |
|
"ˌ": 157, |
|
"ː": 158, |
|
"穵": 159, |
|
"外": 160, |
|
"万": 161, |
|
"ʰ": 162, |
|
"王": 163, |
|
"ʲ": 164, |
|
"为": 165, |
|
"文": 166, |
|
"瓮": 167, |
|
"我": 168, |
|
"3": 169, |
|
"5": 170, |
|
"1": 171, |
|
"2": 172, |
|
"4": 173, |
|
"元": 175, |
|
"云": 176, |
|
"ᵻ": 177 |
|
} |
|
} |