add tokenizer
Browse files- vocab.json +1 -1
vocab.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"
|
|
|
1 |
+
{"q": 0, "x": 1, "ƙ": 2, "“": 3, "y": 4, "f": 5, "ɓ": 6, "’": 7, "h": 8, "d": 9, "t": 10, "u": 11, "n": 12, "r": 13, "a": 14, "j": 15, "ɗ": 16, "p": 18, "”": 19, "g": 20, "m": 21, "v": 22, "w": 23, "l": 24, "í": 25, "k": 26, "s": 27, "z": 28, "ʻ": 29, "i": 30, "o": 31, "'": 32, "—": 33, "ƴ": 34, "b": 35, "e": 36, "c": 37, "|": 17, "[UNK]": 38, "[PAD]": 39}
|