Xuezha committed on
Commit
b14cf69
·
verified ·
1 Parent(s): b773bbf

Upload tokenizer

Browse files
Files changed (2) hide show
  1. special_tokens_map.json +1 -1
  2. tokenizer_config.json +2 -2
special_tokens_map.json CHANGED
@@ -4,7 +4,7 @@
4
  "<|im_end|>"
5
  ],
6
  "eos_token": {
7
- "content": "<|im_end|>",
8
  "lstrip": false,
9
  "normalized": false,
10
  "rstrip": false,
 
4
  "<|im_end|>"
5
  ],
6
  "eos_token": {
7
+ "content": "<|endoftext|>",
8
  "lstrip": false,
9
  "normalized": false,
10
  "rstrip": false,
tokenizer_config.json CHANGED
@@ -31,9 +31,9 @@
31
  "<|im_end|>"
32
  ],
33
  "bos_token": null,
34
- "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
35
  "clean_up_tokenization_spaces": false,
36
- "eos_token": "<|im_end|>",
37
  "errors": "replace",
38
  "model_max_length": 32768,
39
  "pad_token": "<|endoftext|>",
 
31
  "<|im_end|>"
32
  ],
33
  "bos_token": null,
34
+ "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
35
  "clean_up_tokenization_spaces": false,
36
+ "eos_token": "<|endoftext|>",
37
  "errors": "replace",
38
  "model_max_length": 32768,
39
  "pad_token": "<|endoftext|>",