w2v-bert-merg_mgl / vocab.json
Mengkedalai's picture
Upload tokenizer
386ba90 verified
raw
history blame contribute delete
442 Bytes
{
"[PAD]": 36,
"[UNK]": 35,
"|": 0,
"а": 1,
"б": 2,
"в": 3,
"г": 4,
"д": 5,
"е": 6,
"ж": 7,
"з": 8,
"и": 9,
"й": 10,
"к": 11,
"л": 12,
"м": 13,
"н": 14,
"о": 15,
"п": 16,
"р": 17,
"с": 18,
"т": 19,
"у": 20,
"ф": 21,
"х": 22,
"ц": 23,
"ч": 24,
"ш": 25,
"щ": 26,
"ы": 27,
"ь": 28,
"э": 29,
"ю": 30,
"я": 31,
"ё": 32,
"ү": 33,
"ө": 34
}