MuXodious committed on
Commit
3baff27
·
verified ·
1 Parent(s): 0ad486d

Tokenizers

Browse files
Files changed (2) hide show
  1. tokenizer.json +2 -2
  2. tokenizer_config.json +2 -2
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1e5daf1e619597fd56ff036925ea189916417c665d5bdd61b80199cf8d4e6d2
3
- size 17078029
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94298edb1189fa83fdb219ce9ae8a4e3e257aa07c86309f5fffae782fbeefffe
3
+ size 17078146
tokenizer_config.json CHANGED
@@ -8008,14 +8008,14 @@
8008
  "<|im_start|>"
8009
  ],
8010
  "bos_token": "<s>",
8011
- "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
8012
  "clean_up_tokenization_spaces": false,
8013
  "eos_token": "<|im_end|>",
8014
  "extra_special_tokens": {},
 
8015
  "legacy": true,
8016
  "model_max_length": 131072,
8017
  "pad_token": "<pad>",
8018
- "tokenizer_class": "LlamaTokenizer",
8019
  "unk_token": "<unk>",
8020
  "use_default_system_prompt": false
8021
  }
 
8008
  "<|im_start|>"
8009
  ],
8010
  "bos_token": "<s>",
 
8011
  "clean_up_tokenization_spaces": false,
8012
  "eos_token": "<|im_end|>",
8013
  "extra_special_tokens": {},
8014
+ "fix_mistral_regex": true,
8015
  "legacy": true,
8016
  "model_max_length": 131072,
8017
  "pad_token": "<pad>",
8018
+ "tokenizer_class": "LlamaTokenizerFast",
8019
  "unk_token": "<unk>",
8020
  "use_default_system_prompt": false
8021
  }