Shubham09 committed on
Commit
e2b16bc
·
1 Parent(s): 24e3ef0

Upload tokenizer

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +1 -1
tokenizer_config.json CHANGED
@@ -1,6 +1,7 @@
1
  {
2
  "add_prefix_space": false,
3
  "bos_token": "<s>",
 
4
  "cls_token": "<s>",
5
  "eos_token": "</s>",
6
  "errors": "replace",
@@ -8,7 +9,6 @@
8
  "model_max_length": 1024,
9
  "pad_token": "<pad>",
10
  "sep_token": "</s>",
11
- "special_tokens_map_file": null,
12
  "tokenizer_class": "BartTokenizer",
13
  "trim_offsets": true,
14
  "unk_token": "<unk>"
 
1
  {
2
  "add_prefix_space": false,
3
  "bos_token": "<s>",
4
+ "clean_up_tokenization_spaces": true,
5
  "cls_token": "<s>",
6
  "eos_token": "</s>",
7
  "errors": "replace",
 
9
  "model_max_length": 1024,
10
  "pad_token": "<pad>",
11
  "sep_token": "</s>",
 
12
  "tokenizer_class": "BartTokenizer",
13
  "trim_offsets": true,
14
  "unk_token": "<unk>"