NeuraCraft committed on
Commit
22a1695
·
1 Parent(s): b8ca844

Upload tokenizer

Browse files
Files changed (2) hide show
  1. chat_template.jinja +4 -0
  2. tokenizer_config.json +0 -1
chat_template.jinja ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{{'<|im_start|>' + message['role'] + '
2
+ ' + message['content'] + '<|im_end|>' + '
3
+ '}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant
4
+ ' }}{% endif %}
tokenizer_config.json CHANGED
@@ -194,7 +194,6 @@
194
  "<|_unuse_missing_100275|>"
195
  ],
196
  "bos_token": "<|endoftext|>",
197
- "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
198
  "clean_up_tokenization_spaces": true,
199
  "eos_token": "<|endoftext|>",
200
  "extra_special_tokens": {},
 
194
  "<|_unuse_missing_100275|>"
195
  ],
196
  "bos_token": "<|endoftext|>",
 
197
  "clean_up_tokenization_spaces": true,
198
  "eos_token": "<|endoftext|>",
199
  "extra_special_tokens": {},