yaswanth commited on
Commit
bcc38db
1 Parent(s): d68a397

add tokenizer

Browse files
Files changed (1) hide show
  1. vocab.json +1 -1
vocab.json CHANGED
@@ -1 +1 @@
1
- {"": 0, "y": 1, "": 2, "": 3, "o": 4, "": 5, "": 6, "v": 7, "": 8, "": 10, "": 11, "": 12, "'": 13, "": 14, "": 15, "": 16, "m": 17, "": 18, "": 19, "": 20, "": 21, "d": 22, "": 23, "": 24, "": 25, "": 26, "": 27, "z": 28, "h": 29, "": 30, "": 31, "": 32, "e": 33, "": 34, "": 35, "": 36, "b": 37, "": 38, "p": 39, "": 40, "l": 41, "u": 42, "g": 43, "": 44, "n": 45, "s": 46, "": 47, "": 48, "": 49, "": 50, "": 51, "ह": 52, "": 53, "": 54, "t": 55, "k": 56, "": 57, "": 58, "": 59, "": 60, "": 61, "": 62, "": 63, "": 64, "i": 65, "": 66, "": 67, "f": 68, "": 69, "": 70, "a": 71, "j": 72, "ि": 73, "": 74, "": 75, "": 76, "w": 77, "": 78, "": 79, "": 80, "c": 81, "": 82, "": 83, "": 84, "": 85, "r": 86, "": 87, "x": 88, "": 89, "": 90, "": 91, "": 92, "|": 9, "[UNK]": 93, "[PAD]": 94}
 
1
+ {"": 0, "g": 1, "": 2, "": 3, "": 4, "": 5, "f": 6, "t": 7, "": 8, "": 9, "c": 10, "": 11, "": 12, "v": 13, "": 14, "": 15, "": 16, "j": 17, "": 18, "": 19, "l": 20, "z": 21, "": 22, "a": 23, "": 24, "s": 25, "": 26, "": 27, "o": 28, "": 29, "n": 30, "k": 31, "": 32, "x": 33, "": 34, "": 35, "u": 36, "i": 37, "": 38, "": 39, "r": 40, "": 41, "p": 42, "": 43, "": 44, "": 45, "": 46, "": 47, "": 48, "": 49, "": 50, "m": 52, "": 53, "ि": 54, "": 55, "": 56, "": 57, "": 58, "": 59, "y": 60, "": 61, "": 62, "": 63, "": 64, "": 65, "w": 66, "": 67, "": 68, "": 69, "e": 70, "": 71, "'": 72, "": 73, "": 74, "": 75, "": 76, "": 77, "": 78, "": 79, "d": 80, "": 81, "": 82, "": 83, "": 84, "": 85, "": 86, "": 87, "h": 88, "": 89, "": 90, "b": 91, "": 92, "|": 51, "[UNK]": 93, "[PAD]": 94}