slplab's picture
Initial commit for wav2vec2-large-robust pronunciation model
caa37fe
raw
history blame
6.53 kB
{
"<pad>": 436,
"<unk>": 437,
"aa": 0,
"aa_ih": 1,
"aa_l": 2,
"aa_ng": 3,
"aa_r": 4,
"aa_uh": 5,
"aa_w": 6,
"aa_w_ih": 7,
"ae": 8,
"ae_ax": 9,
"ae_ax_l": 10,
"ae_ih": 11,
"ae_l": 12,
"ah": 13,
"ah_ax": 14,
"ah_f": 15,
"ah_ih": 16,
"ah_l": 17,
"ah_l_ih": 18,
"ah_l_s": 19,
"ah_m": 20,
"ah_n": 21,
"ah_p": 22,
"ah_r": 23,
"ah_uh": 24,
"ah_uw": 25,
"ah_w": 26,
"ao": 27,
"ao_l": 28,
"ao_r": 29,
"aw": 30,
"aw_ih": 31,
"aw_n": 32,
"ax": 33,
"ax_b": 34,
"ax_d": 35,
"ax_ih": 36,
"ax_k": 37,
"ax_l": 38,
"ax_l_eh": 39,
"ax_l_l": 40,
"ax_m": 41,
"ax_r": 42,
"ax_r_ih": 43,
"ax_z": 44,
"axr": 45,
"axr_ih": 46,
"axr_s": 47,
"axr_z": 48,
"ay": 49,
"ay_ae": 50,
"ay_ax": 51,
"ay_eh": 52,
"ay_l": 53,
"ay_m": 54,
"ay_n": 55,
"ay_r": 56,
"ay_t": 57,
"ay_w_ih": 58,
"b": 59,
"b*": 60,
"b_ah": 61,
"b_ah_l": 62,
"b_ax": 63,
"b_d": 64,
"b_eh": 65,
"b_eu": 66,
"b_ih": 67,
"b_ih_k": 68,
"b_uh": 69,
"bd": 70,
"ch": 71,
"ch_ax_w_ax": 72,
"ch_eu": 73,
"ch_ih": 74,
"ch_uh": 75,
"ch_uh_ah": 76,
"ch_y": 77,
"d": 78,
"d*": 79,
"d_ax": 80,
"d_d": 81,
"d_eu": 82,
"d_ey": 83,
"d_ih": 84,
"d_ih_d": 85,
"d_ih_d_eu": 86,
"d_ih_ng": 87,
"d_ix": 88,
"d_iy": 89,
"d_l": 90,
"d_o": 91,
"d_r": 92,
"d_t": 93,
"d_w": 94,
"d_y": 95,
"d_z": 96,
"dd": 97,
"dd_eu": 98,
"dh": 99,
"dh_ah": 100,
"dh_eh": 101,
"dh_eu": 102,
"dh_ey": 103,
"dx": 104,
"dx_eu": 105,
"dx_ih": 106,
"dx_ih_d": 107,
"dx_ix": 108,
"eh": 109,
"eh_ah": 110,
"eh_ax": 111,
"eh_ax_l_aa": 112,
"eh_g": 113,
"eh_ih": 114,
"eh_ih_aa": 115,
"eh_k": 116,
"eh_l": 117,
"eh_m": 118,
"eh_r": 119,
"eh_td": 120,
"eh_uw": 121,
"eh_w_ih": 122,
"er": 123,
"er_eh": 124,
"er_ih": 125,
"er_l": 126,
"er_n": 127,
"eu": 128,
"ey": 129,
"ey_ah": 130,
"ey_d": 131,
"ey_dd": 132,
"ey_f": 133,
"ey_ih": 134,
"ey_jh": 135,
"ey_p": 136,
"ey_s": 137,
"ey_w_ih": 138,
"ey_w_iy": 139,
"f": 140,
"f_ah": 141,
"f_ao": 142,
"f_ax": 143,
"f_eu": 144,
"f_r": 145,
"f_w": 146,
"g": 147,
"g*": 148,
"g*_w": 149,
"g_ax": 150,
"g_eu": 151,
"g_ih": 152,
"g_l": 153,
"g_uh": 154,
"g_y": 155,
"gd": 156,
"hh": 157,
"hh_ah": 158,
"hh_eu": 159,
"hh_ih": 160,
"hh_ix": 161,
"hh_ow": 162,
"hh_w": 163,
"hh_y": 164,
"ih": 165,
"ih_aa": 166,
"ih_ah": 167,
"ih_ax": 168,
"ih_ax_l": 169,
"ih_axr": 170,
"ih_d": 171,
"ih_eh": 172,
"ih_ih": 173,
"ih_k": 174,
"ih_l": 175,
"ih_n": 176,
"ih_n_ih": 177,
"ih_ng": 178,
"ih_r": 179,
"ih_s": 180,
"ih_td": 181,
"ih_uh": 182,
"ih_w_ih": 183,
"ih_z": 184,
"ix": 185,
"ix_d": 186,
"iy": 187,
"iy_aa": 188,
"iy_ah": 189,
"iy_ax": 190,
"iy_axr": 191,
"iy_d": 192,
"iy_l": 193,
"iy_m": 194,
"iy_n": 195,
"iy_ng": 196,
"iy_p": 197,
"iy_s": 198,
"iy_s_eu": 199,
"iy_z": 200,
"jh": 201,
"jh_ax": 202,
"jh_eu": 203,
"jh_ih": 204,
"jh_ih_s": 205,
"jh_ix": 206,
"jh_iy": 207,
"jh_uh": 208,
"jh_w": 209,
"k": 210,
"k_ah": 211,
"k_ao": 212,
"k_ax": 213,
"k_eu": 214,
"k_ih": 215,
"k_l": 216,
"k_o": 217,
"k_s": 218,
"k_s_eu": 219,
"k_t": 220,
"k_t_eu": 221,
"k_th": 222,
"k_uh": 223,
"k_w": 224,
"k_y": 225,
"kd": 226,
"kd_s": 227,
"l": 228,
"l_ah": 229,
"l_ah_l": 230,
"l_ax": 231,
"l_ay": 232,
"l_eh": 233,
"l_eu": 234,
"l_f": 235,
"l_ih": 236,
"l_ix": 237,
"l_s": 238,
"m": 239,
"m_ax": 240,
"m_b": 241,
"m_b_eu": 242,
"m_eh": 243,
"m_eu": 244,
"m_f": 245,
"m_ih": 246,
"m_ix": 247,
"m_m": 248,
"m_n": 249,
"m_s": 250,
"m_t_eu": 251,
"m_z": 252,
"n": 253,
"n_ax": 254,
"n_d": 255,
"n_d_eu": 256,
"n_dd": 257,
"n_eh": 258,
"n_eu": 259,
"n_ih": 260,
"n_ix": 261,
"n_n": 262,
"n_o": 263,
"n_s": 264,
"n_td": 265,
"n_y": 266,
"ng": 267,
"ng_ah": 268,
"ng_g": 269,
"ng_k": 270,
"ng_s": 271,
"o": 272,
"o_aa": 273,
"o_ah": 274,
"o_ax": 275,
"o_ih": 276,
"o_l": 277,
"o_n": 278,
"o_r": 279,
"o_s": 280,
"o_uh": 281,
"ow": 282,
"ow_ix": 283,
"ow_s": 284,
"ow_t": 285,
"ow_td": 286,
"oy": 287,
"oy_n": 288,
"p": 289,
"p_ah": 290,
"p_ax": 291,
"p_b": 292,
"p_eh": 293,
"p_eu": 294,
"p_ih": 295,
"p_ix": 296,
"p_l": 297,
"p_o": 298,
"p_r": 299,
"p_uh": 300,
"pd": 301,
"r": 302,
"r_aa": 303,
"r_ah": 304,
"r_ax": 305,
"r_ay": 306,
"r_eh": 307,
"r_eu": 308,
"r_ih": 309,
"r_l": 310,
"r_o": 311,
"r_s": 312,
"r_uh": 313,
"r_w": 314,
"r_w_ah_n": 315,
"r_y": 316,
"s": 317,
"s_ah": 318,
"s_ax": 319,
"s_ch": 320,
"s_d": 321,
"s_dd": 322,
"s_eh": 323,
"s_eu": 324,
"s_eu_l_ih": 325,
"s_ih": 326,
"s_ih_s": 327,
"s_ih_s_eu": 328,
"s_iy": 329,
"s_t": 330,
"s_t_eu": 331,
"s_td": 332,
"s_ts": 333,
"s_uh": 334,
"s_y": 335,
"sh": 336,
"sh_ax": 337,
"sh_ih": 338,
"sh_ih_dd": 339,
"sh_iy": 340,
"sh_uh": 341,
"sh_uw": 342,
"sil": 343,
"t": 344,
"t_ah": 345,
"t_ax": 346,
"t_ay": 347,
"t_eh": 348,
"t_eu": 349,
"t_eu_s": 350,
"t_eu_s_eu": 351,
"t_eu_t": 352,
"t_ih": 353,
"t_ih_d": 354,
"t_ix": 355,
"t_iy": 356,
"t_o": 357,
"t_r": 358,
"t_s": 359,
"t_uh": 360,
"t_uw": 361,
"t_y": 362,
"td": 363,
"th": 364,
"th_ax": 365,
"th_eu": 366,
"th_r": 367,
"ts": 368,
"ts_ax": 369,
"ts_eu": 370,
"ts_y": 371,
"uh": 372,
"uh_aa": 373,
"uh_ah": 374,
"uh_ah_l": 375,
"uh_ax": 376,
"uh_axr": 377,
"uh_er": 378,
"uh_ih": 379,
"uh_l": 380,
"uh_r": 381,
"uh_s": 382,
"uh_w_ao": 383,
"uw": 384,
"uw_ah": 385,
"uw_ax": 386,
"uw_er": 387,
"uw_ih": 388,
"uw_l": 389,
"uw_m": 390,
"uw_r": 391,
"uw_w_ih": 392,
"uw_w_iy": 393,
"v": 394,
"v_ax": 395,
"v_axr": 396,
"v_eh": 397,
"v_eu": 398,
"v_ih": 399,
"v_s": 400,
"w": 401,
"w_ae": 402,
"w_ah": 403,
"w_ao": 404,
"w_axr": 405,
"w_ay": 406,
"w_eh": 407,
"w_er": 408,
"w_ih": 409,
"w_ih_l": 410,
"w_r": 411,
"y": 412,
"y_ah": 413,
"y_aw": 414,
"y_eh": 415,
"y_er": 416,
"y_ih_r": 417,
"y_o": 418,
"y_o_l": 419,
"y_uh": 420,
"y_uw": 421,
"z": 422,
"z_ax": 423,
"z_d_eu": 424,
"z_eu": 425,
"z_eu_d": 426,
"z_ih": 427,
"z_ih_s": 428,
"z_ih_z": 429,
"z_s_eu": 430,
"zh": 431,
"zh_eu": 432,
"zh_ih": 433,
"zh_uh": 434,
"zh_uw": 435
}