openPangu-VL-7B / tokenizer_config.json
wangrongsheng's picture
Upload folder using huggingface_hub
1688f96 verified
{
"add_bos_token": false,
"add_eos_token": false,
"add_prefix_space": true,
"added_tokens_decoder": {
"0": {
"content": "<unk>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"1": {
"content": "<s>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2": {
"content": "</s>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45806": {
"content": "<|User|>:",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45813": {
"content": "<|Bot|>:",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45830": {
"content": "[unused0]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45840": {
"content": "[unused1]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45846": {
"content": "[unused2]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45849": {
"content": "[unused3]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45861": {
"content": "[unused4]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45866": {
"content": "[unused5]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45874": {
"content": "[unused6]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45883": {
"content": "[unused7]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45884": {
"content": "[unused8]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45887": {
"content": "[unused9]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45892": {
"content": "[unused10]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45920": {
"content": "[unused11]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45932": {
"content": "[unused12]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45938": {
"content": "[unused13]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45953": {
"content": "[unused14]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45968": {
"content": "[unused15]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45974": {
"content": "[unused16]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45982": {
"content": "[unused17]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"45986": {
"content": "[unused18]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46005": {
"content": "[unused19]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46007": {
"content": "[unused20]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46014": {
"content": "[unused21]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46017": {
"content": "[unused22]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46028": {
"content": "[unused23]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46032": {
"content": "[unused24]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46081": {
"content": "[unused25]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46086": {
"content": "[unused26]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46101": {
"content": "[unused27]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46183": {
"content": "[unused28]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46230": {
"content": "[unused29]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46245": {
"content": "[unused30]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"46257": {
"content": "[unused31]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"144208": {
"content": "[unused32]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"144209": {
"content": "[unused33]",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
}
},
"auto_map": {
"AutoTokenizer": [
"tokenization_openpangu.OpenPanguTokenizer",
null
]
},
"bos_token": "<s>",
"clean_up_tokenization_spaces": false,
"eos_token": "[unused10]",
"legacy": true,
"model_max_length": 1000000000000000019884624838656,
"pad_token": null,
"sp_model_kwargs": {},
"spaces_between_special_tokens": false,
"tokenizer_class": "OpenPanguTokenizer",
"unk_token": "<unk>",
"use_default_system_prompt": false,
"chat_template": "{% macro role_name(role) -%}{%- if role == 'assistant' -%}助手{%- elif role == 'system' -%}系统{%- elif role == 'user' -%}用户{%- elif role == 'tool' -%}工具{%- elif role == 'function' -%}方法{%- else -%}{{ role }}{%- endif -%}{%- endmacro %}{% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message.role != 'system' %}<s>[unused9]系统:[unused10]{% endif %}{% if loop.first and message.role == 'system' %}<s>{% endif %}[unused9]{{ role_name(message.role) }}:{% if message.content is string %}{{ message.content }}[unused10]{% else %}{% for content in message.content %}{% set ctype = content.type|default('') %}{% set is_img = (ctype == 'image') or ('image' in content) or ('image_url' in content) %}{% set is_vid = (ctype == 'video') or ('video' in content) %}{% if is_img %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}图片 {{ image_count.value }}: {% endif %}[unused18][unused19][unused20]{% elif is_vid %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}视频 {{ video_count.value }}: {% endif %}[unused18][unused32][unused20]{% elif content.text is defined %}{{ content.text }}{% endif %}{% endfor %}[unused10]{% endif %}{% endfor %}{% if add_generation_prompt %}[unused9]助手:{% endif %}"
}