talkie-box / tokenizer_config.json
N8Programs's picture
Fix Talkie chat template leading newline
72d207e verified
{
"backend": "tokenizers",
"chat_template": "{%- set prelude = '\\nThe following conversation took place between the HUMAN, and TALKIE - a mechanical mind imbued with the knowledge of the world and the ability to use human language - a \"thinking machine\". It is published here for the benefit of the public:' -%}{{- prelude -}}{%- for message in messages -%}{%- if message['role'] == 'user' -%}{{- '\\n\\nHUMAN:\\n\\n' + (message['content'] | trim) -}}{%- elif message['role'] == 'assistant' -%}{{- '\\n\\nTALKIE:\\n\\n' + (message['content'] | trim) -}}{%- elif message['role'] == 'system' -%}{{- '\\n\\n' + (message['content'] | trim) -}}{%- else -%}{{- raise_exception('Unsupported role: ' + message['role']) -}}{%- endif -%}{%- endfor -%}{%- if add_generation_prompt and (messages | length == 0 or messages[-1]['role'] != 'assistant') -%}{{- '\\n\\nTALKIE:\\n\\n' -}}{%- endif -%}",
"clean_up_tokenization_spaces": false,
"eos_token": "<|endoftext|>",
"is_local": true,
"model_max_length": 2048,
"pad_token": "<|endoftext|>",
"tokenizer_class": "TokenizersBackend"
}