Update tokenizer_config.json
Browse files
- tokenizer_config.json +1 -1
tokenizer_config.json
CHANGED
|
@@ -23,7 +23,7 @@
|
|
| 23 |
"pad_token": "<|endoftext|>",
|
| 24 |
"pretokenize_regex": "(?i:'s|'t|'re|'ve|'m|'ll|'d)|[^\\r\\n\\p{L}\\p{N}]?[\\p{L}\\p{M}]+|\\p{N}| ?[^\\s\\p{L}\\p{M}\\p{N}]+[\\r\\n]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+",
|
| 25 |
"split_special_tokens": false,
|
| 26 |
-
"tokenizer_class": "
|
| 27 |
"unk_token": null,
|
| 28 |
"video_token": "<|video_pad|>",
|
| 29 |
"vision_bos_token": "<|vision_start|>",
|
|
|
|
| 23 |
"pad_token": "<|endoftext|>",
|
| 24 |
"pretokenize_regex": "(?i:'s|'t|'re|'ve|'m|'ll|'d)|[^\\r\\n\\p{L}\\p{N}]?[\\p{L}\\p{M}]+|\\p{N}| ?[^\\s\\p{L}\\p{M}\\p{N}]+[\\r\\n]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+",
|
| 25 |
"split_special_tokens": false,
|
| 26 |
+
"tokenizer_class": "Qwen2Tokenizer",
|
| 27 |
"unk_token": null,
|
| 28 |
"video_token": "<|video_pad|>",
|
| 29 |
"vision_bos_token": "<|vision_start|>",
|