diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..7f2758529da613d81148978b1d5e7ebb72cbfa4f 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text +*.index.json filter=lfs diff=lfs merge=lfs -text +*.index.json filter=lfs diff=lfs merge=lfs -text diff --git a/c25fb092a5e9d2e2/gpqa:diamond|0/e885f4894c244f92/GENERATIVE.parquet b/c25fb092a5e9d2e2/gpqa:diamond|0/e885f4894c244f92/GENERATIVE.parquet new file mode 100644 index 0000000000000000000000000000000000000000..f4d68f1edeaed4f7595c977fecc63ba69589b3f3 --- /dev/null +++ b/c25fb092a5e9d2e2/gpqa:diamond|0/e885f4894c244f92/GENERATIVE.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52335a32aa2a0fd771d06d2be6885870feb8b7454ce20889d7b8fb9cc40218ce +size 4973957 diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..41478957aca7a04b7321022e7d1f73de5badd995 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,103 @@ +[gMASK] +{%- if tools -%} +<|system|> +# Tools + +You may call one or more functions to assist with the user query. + +You are provided with function signatures within XML tags: + +{% for tool in tools %} +{{ tool | tojson(ensure_ascii=False) }} +{% endfor %} + + +For each function call, output the function name and arguments within the following XML format: +{function-name} +{arg-key-1} +{arg-value-1} +{arg-key-2} +{arg-value-2} +... +{%- endif -%} +{%- macro visible_text(content) -%} + {%- if content is string -%} + {{- content }} + {%- elif content is iterable and content is not mapping -%} + {%- for item in content -%} + {%- if item is mapping and item.type == 'text' -%} + {{- item.text }} + {%- elif item is string -%} + {{- item }} + {%- endif -%} + {%- endfor -%} + {%- else -%} + {{- content }} + {%- endif -%} +{%- endmacro -%} +{%- set ns = namespace(last_user_index=-1) %} +{%- for m in messages %} + {%- if m.role == 'user' %} + {% set ns.last_user_index = loop.index0 -%} + {%- endif %} +{%- endfor %} +{% for m in messages %} +{%- if m.role == 'user' -%}<|user|> +{{ visible_text(m.content) }} +{{- '/nothink' if (enable_thinking is defined and not enable_thinking and not visible_text(m.content).endswith("/nothink")) else '' -}} +{%- elif m.role == 'assistant' -%} +<|assistant|> +{%- set reasoning_content = '' %} +{%- set content = visible_text(m.content) %} +{%- if m.reasoning_content is string %} + {%- set reasoning_content = m.reasoning_content %} +{%- else %} + {%- if '' in content %} + {%- set reasoning_content = content.split('')[0].rstrip('\n').split('')[-1].lstrip('\n') %} + {%- set content = content.split('')[-1].lstrip('\n') %} + {%- endif %} +{%- endif %} +{%- if loop.index0 > ns.last_user_index and reasoning_content -%} +{{ '\n' + reasoning_content.strip() + ''}} +{%- else -%} +{{ '\n' }} +{%- endif -%} +{%- if content.strip() -%} +{{ '\n' + content.strip() }} +{%- endif -%} +{% if m.tool_calls %} +{% for tc in m.tool_calls %} +{%- if tc.function %} + {%- set tc = tc.function %} +{%- endif %} +{{ '\n' + tc.name }} +{% set _args = tc.arguments %} +{% for k, v in _args.items() %} +{{ k }} +{{ v | tojson(ensure_ascii=False) if v is not string else v }} +{% endfor %} +{% endfor %} +{% endif %} +{%- elif m.role == 'tool' -%} +{%- if m.content is string -%} +{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|observation|>' }} +{%- endif %} +{{- '\n\n' }} +{{- m.content }} +{{- '\n' }} +{%- else -%} +<|observation|>{% for tr in m.content %} + + +{{ tr.output if tr.output is defined else tr }} +{% endfor -%} +{% endif -%} +{%- elif m.role == 'system' -%} +<|system|> +{{ visible_text(m.content) }} +{%- endif -%} +{%- endfor -%} +{%- if add_generation_prompt -%} + <|assistant|>{{- '\n' if (enable_thinking is defined and not enable_thinking) else '' -}} +{%- endif -%} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d8f995138f6336bdf1bdcaa5495c5e06ff791152 --- /dev/null +++ b/config.json @@ -0,0 +1,89 @@ +{ + "architectures": [ + "Glm4MoeForCausalLM" + ], + "attention_bias": true, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "eos_token_id": [ + 151329, + 151336, + 151338 + ], + "first_k_dense_replace": 3, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 5120, + "initializer_range": 0.02, + "intermediate_size": 12288, + "max_position_embeddings": 202752, + "model_type": "glm4_moe", + "moe_intermediate_size": 1536, + "n_group": 1, + "n_routed_experts": 160, + "n_shared_experts": 1, + "norm_topk_prob": true, + "num_attention_heads": 96, + "num_experts_per_tok": 8, + "num_hidden_layers": 92, + "num_key_value_heads": 8, + "num_nextn_predict_layers": 1, + "pad_token_id": 151329, + "partial_rotary_factor": 0.5, + "quantization_config": { + "config_groups": { + "group_0": { + "format": "float-quantized", + "input_activations": { + "actorder": null, + "block_structure": null, + "dynamic": true, + "group_size": null, + "num_bits": 8, + "observer": null, + "observer_kwargs": {}, + "strategy": "token", + "symmetric": true, + "type": "float" + }, + "output_activations": null, + "targets": [ + "Linear" + ], + "weights": { + "actorder": null, + "block_structure": null, + "dynamic": false, + "group_size": null, + "num_bits": 8, + "observer": "minmax", + "observer_kwargs": {}, + "strategy": "channel", + "symmetric": true, + "type": "float" + } + } + }, + "format": "float-quantized", + "global_compression_ratio": null, + "ignore": [ + "lm_head" + ], + "kv_cache_scheme": null, + "quant_method": "compressed-tensors", + "quantization_status": "compressed", + "sparsity_config": {}, + "transform_config": {}, + "version": "0.12.3.dev31+gb019b89" + }, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 1000000, + "routed_scaling_factor": 2.5, + "tie_word_embeddings": false, + "topk_group": 1, + "transformers_version": "4.57.3", + "use_cache": true, + "use_qk_norm": true, + "vocab_size": 151552 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a7958b7d81d1338ae40db2fd0d9d030effc9e41d --- /dev/null +++ b/generation_config.json @@ -0,0 +1,10 @@ +{ + "_from_model_config": true, + "eos_token_id": [ + 151329, + 151336, + 151338 + ], + "pad_token_id": 151329, + "transformers_version": "4.57.3" +} diff --git a/model-00001-of-00072.safetensors b/model-00001-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3291bcf2b9abb7f0f5ee5c4e90cd1191a5f09cbe --- /dev/null +++ b/model-00001-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25721b828db5edfbbc929be8ad7e920890baaf3ffbf9a7fadf9fbc47b677cbbc +size 4993429864 diff --git a/model-00002-of-00072.safetensors b/model-00002-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..357802804c972df4487558d03d29fb543c8f55ab --- /dev/null +++ b/model-00002-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2349abaa3ccec627bc3264f432274a9c466885f8bdcc9ccf101787d69da0fabc +size 4993855232 diff --git a/model-00003-of-00072.safetensors b/model-00003-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..32e6f549c5ad4f2e5c08a993fd58418c0aad8614 --- /dev/null +++ b/model-00003-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c07b25ebd89a18def43905cf3f1644ea9f522b5c8c33d131234ac4c087987e4 +size 4998106784 diff --git a/model-00004-of-00072.safetensors b/model-00004-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..db21ea7efb0883b7ec3def3d2b9eb6299aa964be --- /dev/null +++ b/model-00004-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4645e7e95aa18fc194537935ea09f58436e88aa5122d2e2b8ac08a999ed52e91 +size 4993854968 diff --git a/model-00005-of-00072.safetensors b/model-00005-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52fc561aee2a81cd549dfa2517f6f058cb962800 --- /dev/null +++ b/model-00005-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d23a8569e612d7e32425666d3e6119bec2e4490a5c1e7fbf46213346058d4f3 +size 4993847864 diff --git a/model-00006-of-00072.safetensors b/model-00006-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..18b9563c661c6e91641e36c29b3cfd4f1a725614 --- /dev/null +++ b/model-00006-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c769475e0161315befa9be4fb9c5aa60126a0eeaf57a1dd36dd8590fab371e5a +size 4993855304 diff --git a/model-00007-of-00072.safetensors b/model-00007-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bbac3529e609d5fb906fa99756527a68f4964875 --- /dev/null +++ b/model-00007-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5124673b217ab4082e6ef7b1460f869c5b7348d1504ed4eb33c5bfa11c77e874 +size 4998107648 diff --git a/model-00008-of-00072.safetensors b/model-00008-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e3cee9c337271b2259bc70c5a9dff641d979b3af --- /dev/null +++ b/model-00008-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fab487a7bb588a90cc64c893a98f8265d70c898c799d34704f855f550828e8f +size 4993856224 diff --git a/model-00009-of-00072.safetensors b/model-00009-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..650df982648f8addb755045b0a1044070193c93d --- /dev/null +++ b/model-00009-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b74c726a5f1f8ad1f30a984063580e18eace50c0f265ae205dcd5c1175a657d1 +size 4993849192 diff --git a/model-00010-of-00072.safetensors b/model-00010-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5ab5df36be2c7d52eedf882bb9109fe304a808ce --- /dev/null +++ b/model-00010-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb5fa8193fc0592b671866ee351356fdfe2ae29b69a1f16e6ccdf6993f1e7ff8 +size 4998108080 diff --git a/model-00011-of-00072.safetensors b/model-00011-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..661b180c2c881fb3f048ad85332937ce85ab45ba --- /dev/null +++ b/model-00011-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8110c182f8e8fcf18567c8e92a92c38e8348fe845e944ec3ee9f028cd1870f1d +size 4993856168 diff --git a/model-00012-of-00072.safetensors b/model-00012-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..396562a4d791ce3db3dcdc96e09d60c20fa98f72 --- /dev/null +++ b/model-00012-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bc2233f5a96aaa91eef34f50afa724f91e76e5f2e526b4933a5d71b4a27c762 +size 4993856224 diff --git a/model-00013-of-00072.safetensors b/model-00013-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b3ec54e8497c11ffc2c14d2d1f144df013ae0988 --- /dev/null +++ b/model-00013-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:261c2613891a4457859b7565748248123e1760e4adccc669674d958ae0e2b089 +size 4993849264 diff --git a/model-00014-of-00072.safetensors b/model-00014-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..558b1da2c9bd9ccc0fc260fbf443e11654e2012d --- /dev/null +++ b/model-00014-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d51f9c6a413c887bf03bebd3baff8c190452353eb3c39cd244473b9ad0f09ca +size 4998108024 diff --git a/model-00015-of-00072.safetensors b/model-00015-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..30daf9ee717bff396ad418dee6fca1626467de29 --- /dev/null +++ b/model-00015-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52266f98495c7e5f9ec51d66ccf5e84069752299102847655b94ad14820752c3 +size 4993856224 diff --git a/model-00016-of-00072.safetensors b/model-00016-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..227f707b0d7e37551422c3d52f43a5eb6dd4aa15 --- /dev/null +++ b/model-00016-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2c172924752b707d9e65a1e4ae3b1dbfc6d8ae1e9e318d063bcf0f1f98a2d4f +size 4993856232 diff --git a/model-00017-of-00072.safetensors b/model-00017-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cc5b1119cbcdf85910643ae7e1ee1856ee00394b --- /dev/null +++ b/model-00017-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daa33b6de08e05e91c4a96d19d57c3010c59b72208cb9941685ce27df9ed8c73 +size 4993849336 diff --git a/model-00018-of-00072.safetensors b/model-00018-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..46728710177940633fbb624819de8e5de8f66bff --- /dev/null +++ b/model-00018-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:863eee2ef11043f24ac6ed5bb0d6f9fff20675018ff03acb9875b9ae44e335d0 +size 4998108024 diff --git a/model-00019-of-00072.safetensors b/model-00019-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..53c59bf77be9a660549e1a04cc4012ce3f0d71b6 --- /dev/null +++ b/model-00019-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eb05642de8fd12329f383ec78dfa75314aa3f64ca2d9c8f366abc39a15ccc8b +size 4993856224 diff --git a/model-00020-of-00072.safetensors b/model-00020-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..65b67ff97e43d46910d87c9bc805d3018472bdc2 --- /dev/null +++ b/model-00020-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5771e51c058668dbe827d3394df24256e3e1a8f6ed09598525b0ea02e2f9008 +size 4993856304 diff --git a/model-00021-of-00072.safetensors b/model-00021-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2dad2e331b91e22fa3e3f7e731e68a0356f2e47a --- /dev/null +++ b/model-00021-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:041ef64961220d6bcc73eb62be4dff71c5b4e21976495ec186427e4cf6925335 +size 4993849408 diff --git a/model-00022-of-00072.safetensors b/model-00022-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9f1c90f1b898b444fba9f581ddc80643e70cbee1 --- /dev/null +++ b/model-00022-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f237e38127ecc32c5a806bbf6a786ad6af502dfd0e61b9db50e1b415520b6ee6 +size 4998108040 diff --git a/model-00023-of-00072.safetensors b/model-00023-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5a51e7f8372e937d66e94cd5b72ff0a551cf5608 --- /dev/null +++ b/model-00023-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db37fc8d4eaa7c210a8b74a0a9399a02f83d1413451eace8b19034fdbea0aa3 +size 4993856224 diff --git a/model-00024-of-00072.safetensors b/model-00024-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8c565eba0beba82651e99781724e8ec5f4dbb6ee --- /dev/null +++ b/model-00024-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fef7e9fdadfae6b70af8410044bb400dc16eede2b72d8a19a764c1dba4a72e5e +size 4993856376 diff --git a/model-00025-of-00072.safetensors b/model-00025-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..082371326833e2a56039eeea1a85ea93b2521add --- /dev/null +++ b/model-00025-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fe7669e82e648a2f5230ab3fb8b2a9a2ff2f0784e23fdf9d2d4e1384df99b08 +size 4998108056 diff --git a/model-00026-of-00072.safetensors b/model-00026-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a870473f6ab877adb11f7b7c54ae97e649406853 --- /dev/null +++ b/model-00026-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48150d8caeac8f8eada58cd14d176263395da2bf515b9f2ada59bb612b21ad33 +size 4993849016 diff --git a/model-00027-of-00072.safetensors b/model-00027-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..51bf47fca0f1cd62e46b4f7faf47c2249b61a7e9 --- /dev/null +++ b/model-00027-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6355fc0e8d56ba65c1ac5c70ccd501d5c51722d7dd36565bbcfb1959b0331960 +size 4993856224 diff --git a/model-00028-of-00072.safetensors b/model-00028-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1ca57351c2981073546c913d31d581f73514e313 --- /dev/null +++ b/model-00028-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17538028a610180938cff98ea064597a50aa78392c13222358bad8243c90c49a +size 4993856448 diff --git a/model-00029-of-00072.safetensors b/model-00029-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3c9c32c83c40c5eaa955e9c0dd15962d1cb43fd7 --- /dev/null +++ b/model-00029-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca4312a56abf0c0827dfa8d75ac382cf8b5ff0cc5cc841555f6006a5aa1d641 +size 4998108016 diff --git a/model-00030-of-00072.safetensors b/model-00030-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ccb0f09c5d6acdc1cd36bfb416923797aa812a3 --- /dev/null +++ b/model-00030-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9345411f95d58e02767d9675ce0d3f11c1ba9a775789259baa1ccc7a75a50851 +size 4993849056 diff --git a/model-00031-of-00072.safetensors b/model-00031-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..594472876f0455183fc4ab9dec7b11aa71659c95 --- /dev/null +++ b/model-00031-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8da13b3f8d015ddfa5f7b5ebb4ecfa65f2bf64700cce04c167fe4202d5624dde +size 4993856256 diff --git a/model-00032-of-00072.safetensors b/model-00032-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2bf01886aae3bc5683ab878e516d476598155ad8 --- /dev/null +++ b/model-00032-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff0373e06cbc467541dc203a6dc098e33652b3632329a4058ebdd242a79281f8 +size 4993856520 diff --git a/model-00033-of-00072.safetensors b/model-00033-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bf359eabe9cb08ab3b2359056660ae406d4ddee9 --- /dev/null +++ b/model-00033-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d88243f4966ca7188cd939528815b9ab8946f34d3a902398fe9126cb04a3b383 +size 4998108016 diff --git a/model-00034-of-00072.safetensors b/model-00034-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e620d4de54cf438b9d3fe6173316fe818637dcc4 --- /dev/null +++ b/model-00034-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ac355bb01ea098acf13be978c09c6fb48f70204e9f3d1b277c3cf7c2b4d155e +size 4993849056 diff --git a/model-00035-of-00072.safetensors b/model-00035-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..68d355572efac13e78ef95801daba82c167e7427 --- /dev/null +++ b/model-00035-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a7add4fe77a159a9580a717e3277791da9c54696fdfffaedf1ddd3eb4850c86 +size 4993856328 diff --git a/model-00036-of-00072.safetensors b/model-00036-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..63609b6dd38476ea0fa70d0150e726ba4c2a66bf --- /dev/null +++ b/model-00036-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81b806c123146eeb98d13f13c72c50465beb31bf5a5d73c009b6123dc4a022b7 +size 4971906464 diff --git a/model-00037-of-00072.safetensors b/model-00037-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ad502c7e688dba714d2b2f030883840f8a7176ab --- /dev/null +++ b/model-00037-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cabc6ab4a3ff425f63800a0ba36e22f723e9c76787f68e83160c5f677b85e04 +size 4996447680 diff --git a/model-00038-of-00072.safetensors b/model-00038-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1287ae441c20a2a28498d4e5203d93ca92995e56 --- /dev/null +++ b/model-00038-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ccc3606bfc95f4f5580a56d8aecf407fc329c6c154f1609e3376c3989274659 +size 4993849056 diff --git a/model-00039-of-00072.safetensors b/model-00039-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f81cd400bae37f645e37d11cce088a3165ede447 --- /dev/null +++ b/model-00039-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bc1bd7b99e5f933f39b533edf4b2361aec033e85f43b237d8d31861585610eb +size 4993856392 diff --git a/model-00040-of-00072.safetensors b/model-00040-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ebe946d9be1d3ee0d53f143a29fcfeeacd4c901b --- /dev/null +++ b/model-00040-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67546927b12db4f69ae35f38ae536bd8be232e2dfdfa4cc904fb9d8f2320488b +size 4998108040 diff --git a/model-00041-of-00072.safetensors b/model-00041-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8a9b5b51a7a78b76e462a45a08a1ce919ce5b2dd --- /dev/null +++ b/model-00041-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e15f12ee749f7e8efcbb47f7b7d22d1d14665f09832f9819a679b1ec29c1c75a +size 4993856200 diff --git a/model-00042-of-00072.safetensors b/model-00042-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f789b6f6f6fa0e8c88a214207388cd705c75146e --- /dev/null +++ b/model-00042-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:896067cc2422fd8604bbc06c49f668d1cf50844949235f7b5df73776b5ff529e +size 4993849056 diff --git a/model-00043-of-00072.safetensors b/model-00043-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e93775f56f36eafdc3fd4e65d020f023f5cdf6f1 --- /dev/null +++ b/model-00043-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b7dc4b5627c8fc35182b2c03e6d34d6ef19a99f07041e80c36a848068cd8443 +size 4993856464 diff --git a/model-00044-of-00072.safetensors b/model-00044-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7951e475a8bbeb393c1fe38c097ee70b0d1ccce4 --- /dev/null +++ b/model-00044-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a7bfef0cb1dfe1d21b2d7e8d14d7892207b2495c31feffadfbe9dd5c070761 +size 4998108024 diff --git a/model-00045-of-00072.safetensors b/model-00045-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cb126f3578f834bcd933ed56d5cb74a7fe9510e5 --- /dev/null +++ b/model-00045-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73227b4e123b655b5f0a8629e1a931a2b7e352e43d5f156d11f5144b2849907b +size 4993856224 diff --git a/model-00046-of-00072.safetensors b/model-00046-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9dfe52122b9ff5414dc39bdd4fcf57b49805f6a1 --- /dev/null +++ b/model-00046-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e0609d1b3252de2cdc34ac259b0e05d493b3bc267aa95d02aa35777742bd4ef +size 4993849096 diff --git a/model-00047-of-00072.safetensors b/model-00047-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a5ca363d7d5a8ee1b2eaea9e8b029e0eedb65fbe --- /dev/null +++ b/model-00047-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:133dba4e5153703d3da553f95a1d2366d95a045bb0d158554e472cba61593d79 +size 4993856536 diff --git a/model-00048-of-00072.safetensors b/model-00048-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc1d1269e00ae4b7bdaef0540c9940b87a38fc0f --- /dev/null +++ b/model-00048-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d536c853663efecbfaefd9b252e574efccbdc1ee58abb3f1a03e213fb1c4b515 +size 4998108024 diff --git a/model-00049-of-00072.safetensors b/model-00049-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9e15e61dfb5d29639c7abcb271638e81e086a8fd --- /dev/null +++ b/model-00049-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a9a3134c107a9c70bbd94188bd6361fd8099676c9a575e149e29df1b338a569 +size 4993856224 diff --git a/model-00050-of-00072.safetensors b/model-00050-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b99b1974fe6d152b92b1e580dae7a0789cf20ad1 --- /dev/null +++ b/model-00050-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54cdd441373b359266265c2b60150d8842d80a6329b6948daf553f429e8e9308 +size 4993849168 diff --git a/model-00051-of-00072.safetensors b/model-00051-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..02a26f94f40468f4b28e4afa05b7fb94460bbfdf --- /dev/null +++ b/model-00051-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872d082b0db2facb410b15394fd2a80d6522f0a8b6b817052dced8f83d40e7df +size 4990277320 diff --git a/model-00052-of-00072.safetensors b/model-00052-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..64bef52f99a2b206d572bcdfb402c3a2237aad60 --- /dev/null +++ b/model-00052-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92f4b45672af16071446ce075dd116f40a4d399b568d1910473397a0cebb0726 +size 4993819280 diff --git a/model-00053-of-00072.safetensors b/model-00053-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9ddc4da5a3e4fb33f1545fba27a69ba0f1c9ee9b --- /dev/null +++ b/model-00053-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb8d6523ff5c771740ebdf7bebfc3abd69a464716255a76e47dea4aab3dd7a3 +size 4993849056 diff --git a/model-00054-of-00072.safetensors b/model-00054-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3f62e38a9a325e9a6b782de7f3e454a46bf6049d --- /dev/null +++ b/model-00054-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e111f7b3a7ee985636c7b68048bbd96d6e4f304df5a96c45fd04064ab2ce0e9 +size 4993856416 diff --git a/model-00055-of-00072.safetensors b/model-00055-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4728b7ff3f60b2b064cd1a5b6b8b6781e8bb5f8f --- /dev/null +++ b/model-00055-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a07074cb5c8f7252150f02422ec1fb523d568a13db6f082861bb8f5c158deb1 +size 4998108024 diff --git a/model-00056-of-00072.safetensors b/model-00056-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0f6f33a02baeb51b0c92502e44e5c001f28010ef --- /dev/null +++ b/model-00056-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2db1c90f6873bc25d5f8be2752c17b7190110a46459570ad228954baf26ef058 +size 4993856216 diff --git a/model-00057-of-00072.safetensors b/model-00057-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ed54a14bac911886bde5e18a291600eff45245a --- /dev/null +++ b/model-00057-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b385c2f9b13d377f4ba01cd5664ad43a9a69dfadc828d0bdacb30d79f0eb709b +size 4993849056 diff --git a/model-00058-of-00072.safetensors b/model-00058-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fd7bb8957a30306363f8906d62114f686f5bd207 --- /dev/null +++ b/model-00058-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a6bc828b7e2dab028b48c25bfe0be2eeaa48ae90847a2c5bfdcf2ccaa87f1e7 +size 4993856488 diff --git a/model-00059-of-00072.safetensors b/model-00059-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4442a50bafde727c0335989cb1e2762aa23923cf --- /dev/null +++ b/model-00059-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd82008bf14ff2a0604ae74f8b34f8a572492f9cdb173bd3424d7a9a7587f66c +size 4998108024 diff --git a/model-00060-of-00072.safetensors b/model-00060-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..45f98c85d8f9ffbc08c6652ccbda4251c442d674 --- /dev/null +++ b/model-00060-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c7cb67852cced1215bb7de9e59483cc799cb413743845827a573cc405812bdd +size 4993856224 diff --git a/model-00061-of-00072.safetensors b/model-00061-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7cec892b0e73a9a5caee9a5e2f6760f8dd626021 --- /dev/null +++ b/model-00061-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feeb2e405d22c95f3c4ce2b602b39467261dba8382be182202a89f8cddc5b675 +size 4993849120 diff --git a/model-00062-of-00072.safetensors b/model-00062-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a5057ba6670e6dd4b7ad90defe676696b78f3848 --- /dev/null +++ b/model-00062-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b6afc7f6a634e6ff4f177bdf36f5424994bd45609bbdd802564e877ad5b3f3 +size 4993856560 diff --git a/model-00063-of-00072.safetensors b/model-00063-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..037f49c055bdbe8f64b1dee1cf136be4dfc52c72 --- /dev/null +++ b/model-00063-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30ed06f0dd3448390cb2c038625cc439b447349d03c623a6026d1e035ecf55d9 +size 4998108024 diff --git a/model-00064-of-00072.safetensors b/model-00064-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0fe839b4d69c6caa091ad7973d27a73db1dbccd2 --- /dev/null +++ b/model-00064-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c416da818c8192a087b107de208f1e5e4399bcf91c917a2b1946a61ee1c81ace +size 4993856224 diff --git a/model-00065-of-00072.safetensors b/model-00065-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..927afc608d77907302aae3bb091bf8c2afd7663a --- /dev/null +++ b/model-00065-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29f91de2514e01dbda521a59c8ebc2e94e2ffbd5fd764062026aa7de763daa6d +size 4993849192 diff --git a/model-00066-of-00072.safetensors b/model-00066-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..742aa30ffd21f7c3d5bb0374c365c7ff65eef89e --- /dev/null +++ b/model-00066-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3256edeb5623a5efc8a6e2a13cc4e2b2e95dd5944679abc7dd5c5d7ae818fc4a +size 4998108080 diff --git a/model-00067-of-00072.safetensors b/model-00067-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0494cddd537c259f256b6cd552e82af5709e474f --- /dev/null +++ b/model-00067-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1df59874d305d1f0adc5b795507f8cf5608140f64cc2408a02d67ca19fc77d15 +size 4993856168 diff --git a/model-00068-of-00072.safetensors b/model-00068-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..64212406b125650bf7c3db02a73f21c7aa30fc79 --- /dev/null +++ b/model-00068-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f74ce6588b8a563ebd7c622c66e721349e40f6569810399e65dcf048934348bd +size 4993856224 diff --git a/model-00069-of-00072.safetensors b/model-00069-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..de6091db2d20cb58f3598f1d4d53709fd440635d --- /dev/null +++ b/model-00069-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:693c9ddd396cabce2b89c52bebea4ffb60031e1b0bafcba1554413342904533e +size 4993849264 diff --git a/model-00070-of-00072.safetensors b/model-00070-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ca5a62a82b660df76e4b52c2c77ab5ca659a3e2a --- /dev/null +++ b/model-00070-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7682627f7b14e0a4847c07ffc257f760698a9557517ac22ad2ae2ca943cc014 +size 4998108024 diff --git a/model-00071-of-00072.safetensors b/model-00071-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7f15dfe69b67dec8cabb1f33c8ea1138814f7a81 --- /dev/null +++ b/model-00071-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d36b1c53f0026946a1dad7ed507626c6ca145a19542d5f7516f3d365ca0c4c13 +size 3503839048 diff --git a/model-00072-of-00072.safetensors b/model-00072-of-00072.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..898ac7fae2f21ce370168e6a67b83112a19b0ce7 --- /dev/null +++ b/model-00072-of-00072.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ed732a1f52d39814adc6a0b127bad1c816b89d7055fa07b029cba98deba7bf +size 1551892608 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..3d58b87b399b02a43c9ab0450a643d361e6323ca --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:966776dc8935250b223659688987cd6aeff5db7d7aae4baf777fffad2b887bcf +size 8179620 diff --git a/recipe.yaml b/recipe.yaml new file mode 100644 index 0000000000000000000000000000000000000000..a5e1f6626c47a2f698c834c5d59ebd2d4d06aa47 --- /dev/null +++ b/recipe.yaml @@ -0,0 +1,6 @@ +default_stage: + default_modifiers: + QuantizationModifier: + targets: [Linear] + ignore: [lm_head, .*\.mlp\.gate($|\.)] + scheme: FP8_DYNAMIC diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..9028cf84013844f17d7616bdec1d88e977924434 --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,40 @@ +{ + "additional_special_tokens": [ + "<|endoftext|>", + "[MASK]", + "[gMASK]", + "[sMASK]", + "", + "", + "<|system|>", + "<|user|>", + "<|assistant|>", + "<|observation|>", + "<|begin_of_image|>", + "<|end_of_image|>", + "<|begin_of_video|>", + "<|end_of_video|>", + "<|begin_of_audio|>", + "<|end_of_audio|>", + "<|begin_of_transcription|>", + "<|end_of_transcription|>", + "<|code_prefix|>", + "<|code_middle|>", + "<|code_suffix|>", + "/nothink" + ], + "eos_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..e3ed3c66baf1ec4de61840b0abf02142687bfed8 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda8e2146c3bb7b7e0fc96dcc4f0aeff041c6c27952e3ace0665663ebff346ba +size 19970700 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..75e11cfb2e0cc09f19391ec2278b4825a4c3fae9 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,325 @@ +{ + "added_tokens_decoder": { + "151329": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151330": { + "content": "[MASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151331": { + "content": "[gMASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151332": { + "content": "[sMASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151333": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151334": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151335": { + "content": "<|system|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151336": { + "content": "<|user|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151337": { + "content": "<|assistant|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151338": { + "content": "<|observation|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151339": { + "content": "<|begin_of_image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151340": { + "content": "<|end_of_image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151341": { + "content": "<|begin_of_video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151342": { + "content": "<|end_of_video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151343": { + "content": "<|begin_of_audio|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151344": { + "content": "<|end_of_audio|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151345": { + "content": "<|begin_of_transcription|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151346": { + "content": "<|end_of_transcription|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151347": { + "content": "<|code_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151348": { + "content": "<|code_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151349": { + "content": "<|code_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151350": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151351": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151352": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151353": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151354": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151355": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151356": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151357": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151358": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151359": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151360": { + "content": "/nothink", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151361": { + "content": "<|begin_of_box|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151362": { + "content": "<|end_of_box|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151363": { + "content": "<|image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151364": { + "content": "<|video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|endoftext|>", + "[MASK]", + "[gMASK]", + "[sMASK]", + "", + "", + "<|system|>", + "<|user|>", + "<|assistant|>", + "<|observation|>", + "<|begin_of_image|>", + "<|end_of_image|>", + "<|begin_of_video|>", + "<|end_of_video|>", + "<|begin_of_audio|>", + "<|end_of_audio|>", + "<|begin_of_transcription|>", + "<|end_of_transcription|>", + "<|code_prefix|>", + "<|code_middle|>", + "<|code_suffix|>", + "/nothink" + ], + "clean_up_tokenization_spaces": false, + "do_lower_case": false, + "eos_token": "<|endoftext|>", + "extra_special_tokens": {}, + "model_max_length": 128000, + "pad_token": "<|endoftext|>", + "padding_side": "left", + "remove_space": false, + "tokenizer_class": "PreTrainedTokenizerFast" +}