Youmnaaaa committed on
Commit
3c8440d
·
verified ·
1 Parent(s): eef4bc6

Upload tokenizer_config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +2 -8
tokenizer_config.json CHANGED
@@ -1,23 +1,17 @@
1
  {
2
- "backend": "tokenizers",
3
  "bos_token": "<s>",
4
  "cls_token": "<s>",
5
  "do_lower_case": true,
6
  "eos_token": "</s>",
7
- "is_local": false,
8
  "mask_token": "<mask>",
9
- "max_length": 128,
10
  "model_max_length": 128,
11
- "pad_to_multiple_of": null,
12
  "pad_token": "<pad>",
13
  "pad_token_type_id": 0,
14
  "padding_side": "right",
15
  "sep_token": "</s>",
16
- "stride": 0,
17
  "strip_accents": null,
18
  "tokenize_chinese_chars": true,
19
- "tokenizer_class": "TokenizersBackend",
20
  "truncation_side": "right",
21
- "truncation_strategy": "longest_first",
22
  "unk_token": "<unk>"
23
- }
 
1
  {
 
2
  "bos_token": "<s>",
3
  "cls_token": "<s>",
4
  "do_lower_case": true,
5
  "eos_token": "</s>",
 
6
  "mask_token": "<mask>",
 
7
  "model_max_length": 128,
 
8
  "pad_token": "<pad>",
9
  "pad_token_type_id": 0,
10
  "padding_side": "right",
11
  "sep_token": "</s>",
 
12
  "strip_accents": null,
13
  "tokenize_chinese_chars": true,
14
+ "tokenizer_class": "XLMRobertaTokenizer",
15
  "truncation_side": "right",
 
16
  "unk_token": "<unk>"
17
+ }