add tokenizer
Browse files
.gitignore
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
checkpoint-*/
|
runs/Aug25_14-33-03_510311d14d2f/1661438023.9286213/events.out.tfevents.1661438023.510311d14d2f.70.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:886854397d1da55632e6ee8c90c0c2e3c10f8476eb25312b375ae56844905bfb
|
| 3 |
+
size 4762
|
runs/Aug25_14-33-03_510311d14d2f/events.out.tfevents.1661438023.510311d14d2f.70.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c76614005f19116c9d67c2175eb7e5eccfedb2347b8f4b1cd9d1dba0bb2f91c3
|
| 3 |
+
size 4941
|
vocab.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"s": 0, "
|
|
|
|
| 1 |
+
{"s": 0, "c": 2, "t": 3, "o": 4, "a": 5, "w": 6, "i": 7, "j": 8, "n": 9, "q": 10, "f": 11, "h": 12, "k": 13, "l": 14, "g": 15, "b": 16, "d": 17, "p": 18, "r": 19, "m": 20, "v": 21, "y": 22, "e": 23, "z": 24, "'": 25, "u": 26, "x": 27, "|": 1, "[UNK]": 28, "[PAD]": 29}
|