mms-tts-kbp / vocab.json
sanchit-gandhi's picture
Upload tokenizer
b0f94e8
raw
history blame
483 Bytes
{
" ": 0,
"-": 6,
"_": 38,
"a": 32,
"b": 9,
"c": 16,
"d": 42,
"e": 12,
"f": 1,
"g": 18,
"h": 24,
"i": 7,
"j": 29,
"k": 13,
"l": 31,
"m": 14,
"n": 11,
"o": 27,
"p": 25,
"r": 35,
"s": 41,
"t": 5,
"u": 26,
"v": 23,
"w": 39,
"y": 30,
"z": 4,
"á": 36,
"é": 3,
"ñ": 19,
"ó": 8,
"ú": 21,
"đ": 20,
"ń": 28,
"ŋ": 40,
"ɔ": 34,
"ɖ": 2,
"ɛ": 10,
"ɣ": 33,
"ɩ": 37,
"ʋ": 22,
"́": 17,
"ḿ": 15
}