Upload tokenizer_config.json with huggingface_hub
Browse files- tokenizer_config.json +4 -1
tokenizer_config.json
CHANGED
|
@@ -81,7 +81,10 @@
|
|
| 81 |
"<|im_middle|>"
|
| 82 |
],
|
| 83 |
"auto_map": {
|
| 84 |
-
"AutoTokenizer":
|
|
|
|
|
|
|
|
|
|
| 85 |
},
|
| 86 |
"bos_token": "[BOS]",
|
| 87 |
"chat_template": "{%- for message in messages -%}{%- if loop.first and messages[0]['role'] != 'system' -%}<|im_system|>system<|im_middle|>You are a helpful assistant<|im_end|>{%- endif -%}{%- if message['role'] == 'system' -%}<|im_system|>{%- endif -%}{%- if message['role'] == 'user' -%}<|im_user|>{%- endif -%}{%- if message['role'] == 'assistant' -%}<|im_assistant|>{%- endif -%}{{ message['role'] }}<|im_middle|>{{message['content']}}<|im_end|>{%- endfor -%}{%- if add_generation_prompt -%}<|im_assistant|>assistant<|im_middle|>{%- endif -%}",
|
|
|
|
| 81 |
"<|im_middle|>"
|
| 82 |
],
|
| 83 |
"auto_map": {
|
| 84 |
+
"AutoTokenizer": [
|
| 85 |
+
"tokenization_moonshot.TikTokenTokenizer",
|
| 86 |
+
null
|
| 87 |
+
]
|
| 88 |
},
|
| 89 |
"bos_token": "[BOS]",
|
| 90 |
"chat_template": "{%- for message in messages -%}{%- if loop.first and messages[0]['role'] != 'system' -%}<|im_system|>system<|im_middle|>You are a helpful assistant<|im_end|>{%- endif -%}{%- if message['role'] == 'system' -%}<|im_system|>{%- endif -%}{%- if message['role'] == 'user' -%}<|im_user|>{%- endif -%}{%- if message['role'] == 'assistant' -%}<|im_assistant|>{%- endif -%}{{ message['role'] }}<|im_middle|>{{message['content']}}<|im_end|>{%- endfor -%}{%- if add_generation_prompt -%}<|im_assistant|>assistant<|im_middle|>{%- endif -%}",
|