{ "istftnet": { "upsample_kernel_sizes": [20, 12], "upsample_rates": [10, 6], "gen_istft_hop_size": 5, "gen_istft_n_fft": 20, "resblock_dilation_sizes": [ [1, 3, 5], [1, 3, 5], [1, 3, 5] ], "resblock_kernel_sizes": [3, 7, 11], "upsample_initial_channel": 512 }, "dim_in": 64, "dropout": 0.2, "hidden_dim": 512, "max_conv_dim": 512, "max_dur": 50, "multispeaker": true, "n_layer": 3, "n_mels": 80, "n_token": 178, "style_dim": 128, "text_encoder_kernel_size": 5, "plbert": { "hidden_size": 768, "num_attention_heads": 12, "intermediate_size": 2048, "max_position_embeddings": 512, "num_hidden_layers": 12, "dropout": 0.1 }, "vocab": { ";": 1, ":": 2, ",": 3, ".": 4, "!": 5, "?": 6, "/": 7, "—": 9, "…": 10, "\"": 11, "(": 12, ")": 13, "“": 14, "”": 15, " ": 16, "\u0303": 17, "ʣ": 18, "ʥ": 19, "ʦ": 20, "ʨ": 21, "ᵝ": 22, "ㄓ": 23, "A": 24, "I": 25, "ㄅ": 30, "O": 31, "ㄆ": 32, "Q": 33, "R": 34, "S": 35, "T": 36, "ㄇ": 37, "ㄈ": 38, "W": 39, "ㄉ": 40, "Y": 41, "ᵊ": 42, "a": 43, "b": 44, "c": 45, "d": 46, "e": 47, "f": 48, "ㄊ": 49, "h": 50, "i": 51, "j": 52, "k": 53, "l": 54, "m": 55, "n": 56, "o": 57, "p": 58, "q": 59, "r": 60, "s": 61, "t": 62, "u": 63, "v": 64, "w": 65, "x": 66, "y": 67, "z": 68, "ɑ": 69, "ɐ": 70, "ɒ": 71, "æ": 72, "ㄋ": 73, "ㄌ": 74, "β": 75, "ɔ": 76, "ɕ": 77, "ç": 78, "ㄍ": 79, "ɖ": 80, "ð": 81, "ʤ": 82, "ə": 83, "ㄎ": 84, "ㄦ": 85, "ɛ": 86, "ɜ": 87, "ㄏ": 88, "ㄐ": 89, "ɟ": 90, "ㄑ": 91, "ɡ": 92, "ㄒ": 93, "ㄔ": 94, "ㄕ": 95, "ㄗ": 96, "ㄘ": 97, "ㄙ": 98, "月": 99, "ㄚ": 100, "ɨ": 101, "ɪ": 102, "ʝ": 103, "ㄛ": 104, "ㄝ": 105, "ㄞ": 106, "ㄟ": 107, "ㄠ": 108, "ㄡ": 109, "ɯ": 110, "ɰ": 111, "ŋ": 112, "ɳ": 113, "ɲ": 114, "ɴ": 115, "ø": 116, "ㄢ": 117, "ɸ": 118, "θ": 119, "œ": 120, "ㄣ": 121, "ㄤ": 122, "ɹ": 123, "ㄥ": 124, "ɾ": 125, "ㄖ": 126, "ㄧ": 127, "ʁ": 128, "ɽ": 129, "ʂ": 130, "ʃ": 131, "ʈ": 132, "ʧ": 133, "ㄨ": 134, "ʊ": 135, "ʋ": 136, "ㄩ": 137, "ʌ": 138, "ɣ": 139, "ㄜ": 140, "ㄭ": 141, "χ": 142, "ʎ": 143, "十": 144, "压": 145, "言": 146, "ʒ": 147, "ʔ": 148, "阳": 149, "要": 150, "阴": 151, "应": 152, "用": 153, "又": 154, "中": 155, "ˈ": 156, "ˌ": 157, "ː": 158, "穵": 159, "外": 160, "万": 161, "ʰ": 162, "王": 163, "ʲ": 164, "为": 165, "文": 166, "瓮": 167, "我": 168, "3": 169, "5": 170, "1": 171, "2": 172, "4": 173, "元": 175, "云": 176, "ᵻ": 177 } }