Wimflorijn committed on
Commit
5d76378
·
verified ·
1 Parent(s): 4ac37ae

Upload tokenizer

Browse files
Files changed (1) hide show
  1. tokenizer.json +4 -2
tokenizer.json CHANGED
@@ -1023,7 +1023,8 @@
1023
  {
1024
  "type": "Metaspace",
1025
  "replacement": "▁",
1026
- "add_prefix_space": true
 
1027
  },
1028
  {
1029
  "type": "Digits",
@@ -1080,7 +1081,8 @@
1080
  "decoder": {
1081
  "type": "Metaspace",
1082
  "replacement": "▁",
1083
- "add_prefix_space": true
 
1084
  },
1085
  "model": {
1086
  "type": "Unigram",
 
1023
  {
1024
  "type": "Metaspace",
1025
  "replacement": "▁",
1026
+ "prepend_scheme": "always",
1027
+ "split": true
1028
  },
1029
  {
1030
  "type": "Digits",
 
1081
  "decoder": {
1082
  "type": "Metaspace",
1083
  "replacement": "▁",
1084
+ "prepend_scheme": "always",
1085
+ "split": true
1086
  },
1087
  "model": {
1088
  "type": "Unigram",