Add additional_special_tokens to the tokenizer config
Browse files
- tokenizer_config.json +8 -0
tokenizer_config.json
CHANGED
|
@@ -86,5 +86,13 @@
|
|
| 86 |
"special": true
|
| 87 |
}
|
| 88 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 89 |
"chat_template": "{{ bos_token }}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}"
|
| 90 |
}
|
|
|
|
| 86 |
"special": true
|
| 87 |
}
|
| 88 |
},
|
| 89 |
+
"additional_special_tokens": [
|
| 90 |
+
"<|im_start|>",
|
| 91 |
+
"<|im_end|>",
|
| 92 |
+
"<|action_start|>",
|
| 93 |
+
"<|action_end|>",
|
| 94 |
+
"<|interpreter|>",
|
| 95 |
+
"<|plugin|>"
|
| 96 |
+
],
|
| 97 |
"chat_template": "{{ bos_token }}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}"
|
| 98 |
}
|