AKulk's picture
add tokenizer
5185e15
raw
history blame
621 Bytes
{"zh": 0, "dcl": 1, "em": 2, "t": 3, "ih": 4, "g": 5, "bcl": 6, "ix": 7, "ao": 8, "eh": 9, "iy": 10, "k": 11, "aa": 12, "pau": 13, "uw": 14, "er": 15, "l": 16, "eng": 17, "ey": 18, "ux": 19, "hv": 20, "gcl": 21, "m": 22, "oy": 23, "epi": 24, "h#": 25, "q": 26, "b": 27, "s": 28, "ae": 29, "nx": 30, "jh": 31, "w": 32, "uh": 33, "v": 34, "axr": 35, "r": 36, "aw": 37, "el": 38, "dx": 39, "d": 40, "ax-h": 41, "ow": 42, "p": 43, "ng": 44, "kcl": 45, "ax": 46, "pcl": 47, "y": 48, "th": 49, "ah": 50, "ch": 51, "sh": 52, "f": 53, "z": 54, "dh": 55, "ay": 56, "n": 57, "hh": 58, "en": 59, "tcl": 60, "[UNK]": 61, "[PAD]": 62}