isbondarev committed on
Commit
d8ce879
·
verified ·
1 Parent(s): 6d71df4

Upload tokenizer

Browse files
chat_template.jinja ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {% for message in messages %}{% if message['role'] == 'system' and message['content'] %}{{'<|system|>
2
+ ' + message['content'] + '<|end|>
3
+ '}}{% elif message['role'] == 'user' %}{{'<|user|>
4
+ ' + message['content'] + '<|end|>
5
+ '}}{% elif message['role'] == 'assistant' %}{{'<|assistant|>
6
+ ' + message['content'] + '<|end|>
7
+ '}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>
8
+ ' }}{% else %}{{ eos_token }}{% endif %}
special_tokens_map.json CHANGED
@@ -1,13 +1,4 @@
1
  {
2
- "additional_special_tokens": [
3
- {
4
- "content": "<|end|>",
5
- "lstrip": false,
6
- "normalized": false,
7
- "rstrip": false,
8
- "single_word": false
9
- }
10
- ],
11
  "bos_token": {
12
  "content": "<s>",
13
  "lstrip": false,
@@ -16,7 +7,7 @@
16
  "single_word": false
17
  },
18
  "eos_token": {
19
- "content": "<|endoftext|>",
20
  "lstrip": false,
21
  "normalized": false,
22
  "rstrip": false,
 
1
  {
 
 
 
 
 
 
 
 
 
2
  "bos_token": {
3
  "content": "<s>",
4
  "lstrip": false,
 
7
  "single_word": false
8
  },
9
  "eos_token": {
10
+ "content": "<|end|>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
tokenizer_config.json CHANGED
@@ -116,13 +116,9 @@
116
  "special": true
117
  }
118
  },
119
- "additional_special_tokens": [
120
- "<|end|>"
121
- ],
122
  "bos_token": "<s>",
123
- "chat_template": "{% for message in messages %}{% if message['role'] == 'system' and message['content'] %}{{'<|system|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'user' %}{{'<|user|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|assistant|>\n' + message['content'] + '<|end|>\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ eos_token }}{% endif %}",
124
  "clean_up_tokenization_spaces": false,
125
- "eos_token": "<|endoftext|>",
126
  "extra_special_tokens": {},
127
  "legacy": false,
128
  "model_max_length": 131072,
 
116
  "special": true
117
  }
118
  },
 
 
 
119
  "bos_token": "<s>",
 
120
  "clean_up_tokenization_spaces": false,
121
+ "eos_token": "<|end|>",
122
  "extra_special_tokens": {},
123
  "legacy": false,
124
  "model_max_length": 131072,