Caplin43 committed on
Commit
1206d67
·
verified ·
1 Parent(s): 1cbb6ee

Create tokenizer.json

Browse files
Files changed (1) hide show
  1. tokenizer.json +12 -0
tokenizer.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model": {
3
+ "type": "BPE",
4
+ "vocab_size": 32000
5
+ },
6
+ "normalizer": {
7
+ "type": "Lowercase"
8
+ },
9
+ "pre_tokenizer": {
10
+ "type": "Whitespace"
11
+ }
12
+ }