add tokenizer
Browse files- vocab.json +1 -1
vocab.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"
|
|
|
|
| 1 |
+
{"o": 0, "v": 1, "s": 2, "b": 3, "d": 4, "y": 5, "a": 6, "h": 7, "q": 8, "x": 9, "m": 10, "j": 11, "r": 12, "c": 14, "'": 15, "e": 16, "k": 17, "w": 18, "t": 20, "g": 21, "f": 22, "i": 23, "u": 24, "p": 25, "z": 26, "l": 27, "n": 28, "|": 32, "[UNK]": 28, "[PAD]": 29}
|