Upload tokenizer
- tokenizer.json +1 -1
- tokenizer_config.json +1 -1
tokenizer.json CHANGED
@@ -53,7 +53,7 @@
     "type": "BertNormalizer",
     "clean_text": true,
     "handle_chinese_chars": false,
-    "strip_accents":
+    "strip_accents": true,
     "lowercase": false
   },
   "pre_tokenizer": {
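
For reference, a minimal sketch of what the updated normalizer settings do, written against the standalone tokenizers library (the sample string is illustrative, not from this repo):

from tokenizers.normalizers import BertNormalizer

# Mirror the normalizer block from tokenizer.json after this commit.
normalizer = BertNormalizer(
    clean_text=True,
    handle_chinese_chars=False,
    strip_accents=True,  # the option this commit turns on
    lowercase=False,
)

# With strip_accents=True, combining accents are removed even though
# lowercasing stays disabled.
print(normalizer.normalize_str("Élysée café"))  # -> "Elysee cafe"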
tokenizer_config.json CHANGED
@@ -9,7 +9,7 @@
   "never_split": null,
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
-  "strip_accents":
+  "strip_accents": true,
   "tokenize_chinese_chars": false,
   "tokenizer_class": "BertTokenizer",
   "unk_token": "[UNK]"
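
The same option drives the slow-tokenizer path in transformers, where BertTokenizer delegates basic tokenization to BasicTokenizer. A minimal sketch under the settings above (do_lower_case=False mirrors the "lowercase": false in tokenizer.json; the sample text is illustrative):

from transformers.models.bert.tokenization_bert import BasicTokenizer

# Apply the tokenizer_config.json options that affect basic tokenization.
basic = BasicTokenizer(
    do_lower_case=False,
    tokenize_chinese_chars=False,
    strip_accents=True,  # the option this commit turns on
)

# Accents are stripped while case is preserved.
print(basic.tokenize("Crème brûlée"))  # -> ['Creme', 'brulee']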