kerzgrr committed on
Commit
f9fec46
·
verified ·
1 Parent(s): a16a996

Upload tokenizer_config.json

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +17 -4
tokenizer_config.json CHANGED
@@ -1,13 +1,26 @@
1
  {
 
2
  "tokenizer_file": "tokenizer.json",
3
- "pad_token": "<|pad|>",
4
- "eos_token": "<|eot_id|>",
 
5
  "bos_token": "<|begin_of_text|>",
 
 
6
  "unk_token": "<|unk|>",
7
  "additional_special_tokens": [
8
  "<|start_header_id|>",
9
  "<|end_header_id|>",
10
  "<|eot_id|>"
11
  ],
12
- "add_prefix_space": true
13
- }
 
 
 
 
 
 
 
 
 
 
1
  {
2
+ "tokenizer_class": "PreTrainedTokenizerFast",
3
  "tokenizer_file": "tokenizer.json",
4
+ "model_max_length": 1024,
5
+ "add_prefix_space": true,
6
+ "clean_up_tokenization_spaces": false,
7
  "bos_token": "<|begin_of_text|>",
8
+ "eos_token": "<|eot_id|>",
9
+ "pad_token": "<|pad|>",
10
  "unk_token": "<|unk|>",
11
  "additional_special_tokens": [
12
  "<|start_header_id|>",
13
  "<|end_header_id|>",
14
  "<|eot_id|>"
15
  ],
16
+ "added_tokens_decoder": {
17
+ "0": { "content": "<|pad|>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true },
18
+ "1": { "content": "<|unk|>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true },
19
+ "2": { "content": "<|begin_of_text|>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true },
20
+ "3": { "content": "<|end_of_text|>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true },
21
+ "4": { "content": "<|start_header_id|>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true },
22
+ "5": { "content": "<|end_header_id|>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true },
23
+ "6": { "content": "<|eot_id|>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }
24
+ },
25
+ "chat_template": "{% for message in messages %}{% if loop.first %}<|begin_of_text|>{% endif %}<|start_header_id|>{{ message['role'] }}<|end_header_id|>\n\n{{ message['content'] }}<|eot_id|>{% endfor %}{% if add_generation_prompt %}<|start_header_id|>assistant<|end_header_id|>\n\n{% endif %}"
26
+ }