slplab's picture
Initial commit for wav2vec2-large-robust pronunciation model
dae90d9
raw
history blame
1.23 kB
{
"<pad>": 89,
"<unk>": 90,
"aa": 0,
"aa_err": 1,
"ae": 2,
"ae_err": 3,
"ah": 4,
"ah_err": 5,
"ao": 6,
"ao_err": 7,
"aw": 8,
"aw_err": 9,
"ax": 10,
"ax_err": 11,
"ay": 12,
"ay_err": 13,
"b": 14,
"b*": 15,
"b_err": 16,
"ch": 17,
"ch_err": 18,
"d": 19,
"d*": 20,
"d_err": 21,
"dh": 22,
"dh_err": 23,
"eh": 24,
"eh_err": 25,
"er": 26,
"er_err": 27,
"eu": 28,
"eu_err": 29,
"ey": 30,
"ey_err": 31,
"f": 32,
"f_err": 33,
"g": 34,
"g*": 35,
"g_err": 36,
"hh": 37,
"hh_err": 38,
"ih": 39,
"ih_err": 40,
"iy": 41,
"iy_err": 42,
"jh": 43,
"jh_err": 44,
"k": 45,
"k_err": 46,
"l": 47,
"l_err": 48,
"m": 49,
"m_err": 50,
"n": 51,
"n_err": 52,
"ng": 53,
"ng_err": 54,
"o": 55,
"o_err": 56,
"ow": 57,
"ow_err": 58,
"oy": 59,
"oy_err": 60,
"p": 61,
"p_err": 62,
"r": 63,
"r_err": 64,
"s": 65,
"s_err": 66,
"sh": 67,
"sh_err": 68,
"t": 69,
"t_err": 70,
"th": 71,
"th_err": 72,
"ts": 73,
"ts_err": 74,
"uh": 75,
"uh_err": 76,
"uw": 77,
"uw_err": 78,
"v": 79,
"v_err": 80,
"w": 81,
"w_err": 82,
"y": 83,
"y_err": 84,
"z": 85,
"z_err": 86,
"zh": 87,
"zh_err": 88
}