Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +2 -0
- chat_template.jinja +103 -0
- config.json +71 -0
- generation_config.json +10 -0
- hf_quant_config.json +13 -0
- model-00001-of-00071.safetensors +3 -0
- model-00003-of-00071.safetensors +3 -0
- model-00005-of-00071.safetensors +3 -0
- model-00006-of-00071.safetensors +3 -0
- model-00007-of-00071.safetensors +3 -0
- model-00008-of-00071.safetensors +3 -0
- model-00009-of-00071.safetensors +3 -0
- model-00011-of-00071.safetensors +3 -0
- model-00012-of-00071.safetensors +3 -0
- model-00013-of-00071.safetensors +3 -0
- model-00014-of-00071.safetensors +3 -0
- model-00015-of-00071.safetensors +3 -0
- model-00019-of-00071.safetensors +3 -0
- model-00020-of-00071.safetensors +3 -0
- model-00021-of-00071.safetensors +3 -0
- model-00022-of-00071.safetensors +3 -0
- model-00023-of-00071.safetensors +3 -0
- model-00024-of-00071.safetensors +3 -0
- model-00025-of-00071.safetensors +3 -0
- model-00026-of-00071.safetensors +3 -0
- model-00027-of-00071.safetensors +3 -0
- model-00029-of-00071.safetensors +3 -0
- model-00047-of-00071.safetensors +3 -0
- model-00048-of-00071.safetensors +3 -0
- model-00049-of-00071.safetensors +3 -0
- model-00050-of-00071.safetensors +3 -0
- model-00051-of-00071.safetensors +3 -0
- model-00052-of-00071.safetensors +3 -0
- model-00053-of-00071.safetensors +3 -0
- model-00054-of-00071.safetensors +3 -0
- model-00057-of-00071.safetensors +3 -0
- model-00058-of-00071.safetensors +3 -0
- model-00059-of-00071.safetensors +3 -0
- model-00060-of-00071.safetensors +3 -0
- model-00061-of-00071.safetensors +3 -0
- model-00063-of-00071.safetensors +3 -0
- model-00064-of-00071.safetensors +3 -0
- model-00066-of-00071.safetensors +3 -0
- model-00068-of-00071.safetensors +3 -0
- model-00069-of-00071.safetensors +3 -0
- model-00070-of-00071.safetensors +3 -0
- model-00071-of-00071.safetensors +3 -0
- model.safetensors.index.json +3 -0
- special_tokens_map.json +34 -0
- tokenizer.json +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
model.safetensors.index.json filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
chat_template.jinja
ADDED
|
@@ -0,0 +1,103 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[gMASK]<sop>
|
| 2 |
+
{%- if tools -%}
|
| 3 |
+
<|system|>
|
| 4 |
+
# Tools
|
| 5 |
+
|
| 6 |
+
You may call one or more functions to assist with the user query.
|
| 7 |
+
|
| 8 |
+
You are provided with function signatures within <tools></tools> XML tags:
|
| 9 |
+
<tools>
|
| 10 |
+
{% for tool in tools %}
|
| 11 |
+
{{ tool | tojson(ensure_ascii=False) }}
|
| 12 |
+
{% endfor %}
|
| 13 |
+
</tools>
|
| 14 |
+
|
| 15 |
+
For each function call, output the function name and arguments within the following XML format:
|
| 16 |
+
<tool_call>{function-name}
|
| 17 |
+
<arg_key>{arg-key-1}</arg_key>
|
| 18 |
+
<arg_value>{arg-value-1}</arg_value>
|
| 19 |
+
<arg_key>{arg-key-2}</arg_key>
|
| 20 |
+
<arg_value>{arg-value-2}</arg_value>
|
| 21 |
+
...
|
| 22 |
+
</tool_call>{%- endif -%}
|
| 23 |
+
{%- macro visible_text(content) -%}
|
| 24 |
+
{%- if content is string -%}
|
| 25 |
+
{{- content }}
|
| 26 |
+
{%- elif content is iterable and content is not mapping -%}
|
| 27 |
+
{%- for item in content -%}
|
| 28 |
+
{%- if item is mapping and item.type == 'text' -%}
|
| 29 |
+
{{- item.text }}
|
| 30 |
+
{%- elif item is string -%}
|
| 31 |
+
{{- item }}
|
| 32 |
+
{%- endif -%}
|
| 33 |
+
{%- endfor -%}
|
| 34 |
+
{%- else -%}
|
| 35 |
+
{{- content }}
|
| 36 |
+
{%- endif -%}
|
| 37 |
+
{%- endmacro -%}
|
| 38 |
+
{%- set ns = namespace(last_user_index=-1) %}
|
| 39 |
+
{%- for m in messages %}
|
| 40 |
+
{%- if m.role == 'user' %}
|
| 41 |
+
{% set ns.last_user_index = loop.index0 -%}
|
| 42 |
+
{%- endif %}
|
| 43 |
+
{%- endfor %}
|
| 44 |
+
{% for m in messages %}
|
| 45 |
+
{%- if m.role == 'user' -%}<|user|>
|
| 46 |
+
{{ visible_text(m.content) }}
|
| 47 |
+
{{- '/nothink' if (enable_thinking is defined and not enable_thinking and not visible_text(m.content).endswith("/nothink")) else '' -}}
|
| 48 |
+
{%- elif m.role == 'assistant' -%}
|
| 49 |
+
<|assistant|>
|
| 50 |
+
{%- set reasoning_content = '' %}
|
| 51 |
+
{%- set content = visible_text(m.content) %}
|
| 52 |
+
{%- if m.reasoning_content is string %}
|
| 53 |
+
{%- set reasoning_content = m.reasoning_content %}
|
| 54 |
+
{%- else %}
|
| 55 |
+
{%- if '</think>' in content %}
|
| 56 |
+
{%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
|
| 57 |
+
{%- set content = content.split('</think>')[-1].lstrip('\n') %}
|
| 58 |
+
{%- endif %}
|
| 59 |
+
{%- endif %}
|
| 60 |
+
{%- if loop.index0 > ns.last_user_index and reasoning_content -%}
|
| 61 |
+
{{ '\n<think>' + reasoning_content.strip() + '</think>'}}
|
| 62 |
+
{%- else -%}
|
| 63 |
+
{{ '\n<think></think>' }}
|
| 64 |
+
{%- endif -%}
|
| 65 |
+
{%- if content.strip() -%}
|
| 66 |
+
{{ '\n' + content.strip() }}
|
| 67 |
+
{%- endif -%}
|
| 68 |
+
{% if m.tool_calls %}
|
| 69 |
+
{% for tc in m.tool_calls %}
|
| 70 |
+
{%- if tc.function %}
|
| 71 |
+
{%- set tc = tc.function %}
|
| 72 |
+
{%- endif %}
|
| 73 |
+
{{ '\n<tool_call>' + tc.name }}
|
| 74 |
+
{% set _args = tc.arguments %}
|
| 75 |
+
{% for k, v in _args.items() %}
|
| 76 |
+
<arg_key>{{ k }}</arg_key>
|
| 77 |
+
<arg_value>{{ v | tojson(ensure_ascii=False) if v is not string else v }}</arg_value>
|
| 78 |
+
{% endfor %}
|
| 79 |
+
</tool_call>{% endfor %}
|
| 80 |
+
{% endif %}
|
| 81 |
+
{%- elif m.role == 'tool' -%}
|
| 82 |
+
{%- if m.content is string -%}
|
| 83 |
+
{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
|
| 84 |
+
{{- '<|observation|>' }}
|
| 85 |
+
{%- endif %}
|
| 86 |
+
{{- '\n<tool_response>\n' }}
|
| 87 |
+
{{- m.content }}
|
| 88 |
+
{{- '\n</tool_response>' }}
|
| 89 |
+
{%- else -%}
|
| 90 |
+
<|observation|>{% for tr in m.content %}
|
| 91 |
+
|
| 92 |
+
<tool_response>
|
| 93 |
+
{{ tr.output if tr.output is defined else tr }}
|
| 94 |
+
</tool_response>{% endfor -%}
|
| 95 |
+
{% endif -%}
|
| 96 |
+
{%- elif m.role == 'system' -%}
|
| 97 |
+
<|system|>
|
| 98 |
+
{{ visible_text(m.content) }}
|
| 99 |
+
{%- endif -%}
|
| 100 |
+
{%- endfor -%}
|
| 101 |
+
{%- if add_generation_prompt -%}
|
| 102 |
+
<|assistant|>{{- '\n<think></think>' if (enable_thinking is defined and not enable_thinking) else '' -}}
|
| 103 |
+
{%- endif -%}
|
config.json
ADDED
|
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"Glm4MoeForCausalLM"
|
| 4 |
+
],
|
| 5 |
+
"attention_bias": true,
|
| 6 |
+
"attention_dropout": 0.0,
|
| 7 |
+
"dtype": "bfloat16",
|
| 8 |
+
"eos_token_id": [
|
| 9 |
+
151329,
|
| 10 |
+
151336,
|
| 11 |
+
151338
|
| 12 |
+
],
|
| 13 |
+
"first_k_dense_replace": 3,
|
| 14 |
+
"head_dim": 128,
|
| 15 |
+
"hidden_act": "silu",
|
| 16 |
+
"hidden_size": 5120,
|
| 17 |
+
"initializer_range": 0.02,
|
| 18 |
+
"intermediate_size": 12288,
|
| 19 |
+
"max_position_embeddings": 202752,
|
| 20 |
+
"model_type": "glm4_moe",
|
| 21 |
+
"moe_intermediate_size": 1536,
|
| 22 |
+
"n_group": 1,
|
| 23 |
+
"n_routed_experts": 160,
|
| 24 |
+
"n_shared_experts": 1,
|
| 25 |
+
"norm_topk_prob": true,
|
| 26 |
+
"num_attention_heads": 96,
|
| 27 |
+
"num_experts_per_tok": 8,
|
| 28 |
+
"num_hidden_layers": 92,
|
| 29 |
+
"num_key_value_heads": 8,
|
| 30 |
+
"num_nextn_predict_layers": 1,
|
| 31 |
+
"pad_token_id": 151329,
|
| 32 |
+
"partial_rotary_factor": 0.5,
|
| 33 |
+
"rms_norm_eps": 1e-05,
|
| 34 |
+
"rope_scaling": null,
|
| 35 |
+
"rope_theta": 1000000,
|
| 36 |
+
"routed_scaling_factor": 2.5,
|
| 37 |
+
"tie_word_embeddings": false,
|
| 38 |
+
"topk_group": 1,
|
| 39 |
+
"transformers_version": "4.57.0",
|
| 40 |
+
"use_cache": true,
|
| 41 |
+
"use_qk_norm": true,
|
| 42 |
+
"vocab_size": 151552,
|
| 43 |
+
"quantization_config": {
|
| 44 |
+
"config_groups": {
|
| 45 |
+
"group_0": {
|
| 46 |
+
"input_activations": {
|
| 47 |
+
"dynamic": false,
|
| 48 |
+
"num_bits": 8,
|
| 49 |
+
"type": "float"
|
| 50 |
+
},
|
| 51 |
+
"weights": {
|
| 52 |
+
"dynamic": false,
|
| 53 |
+
"num_bits": 8,
|
| 54 |
+
"type": "float"
|
| 55 |
+
},
|
| 56 |
+
"targets": [
|
| 57 |
+
"Linear"
|
| 58 |
+
]
|
| 59 |
+
}
|
| 60 |
+
},
|
| 61 |
+
"ignore": [
|
| 62 |
+
"lm_head"
|
| 63 |
+
],
|
| 64 |
+
"quant_algo": "FP8",
|
| 65 |
+
"producer": {
|
| 66 |
+
"name": "modelopt",
|
| 67 |
+
"version": "0.37.0.dev82+g340eb7a75"
|
| 68 |
+
},
|
| 69 |
+
"quant_method": "modelopt"
|
| 70 |
+
}
|
| 71 |
+
}
|
generation_config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_from_model_config": true,
|
| 3 |
+
"eos_token_id": [
|
| 4 |
+
151329,
|
| 5 |
+
151336,
|
| 6 |
+
151338
|
| 7 |
+
],
|
| 8 |
+
"pad_token_id": 151329,
|
| 9 |
+
"transformers_version": "4.57.0"
|
| 10 |
+
}
|
hf_quant_config.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"producer": {
|
| 3 |
+
"name": "modelopt",
|
| 4 |
+
"version": "0.37.0.dev82+g340eb7a75"
|
| 5 |
+
},
|
| 6 |
+
"quantization": {
|
| 7 |
+
"quant_algo": "FP8",
|
| 8 |
+
"kv_cache_quant_algo": null,
|
| 9 |
+
"exclude_modules": [
|
| 10 |
+
"lm_head"
|
| 11 |
+
]
|
| 12 |
+
}
|
| 13 |
+
}
|
model-00001-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45980fde390758cea8f820b2dba1819d985de88861a43a03c219422ea22a0166
|
| 3 |
+
size 4999379048
|
model-00003-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e956673c9afaad86984606749e6496fb35d503a014e748ed5cce66539275fbc8
|
| 3 |
+
size 4994814392
|
model-00005-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30b83ffc35553df1506860d378f3785d7c5f78ad50b915265cf3d24d545048a9
|
| 3 |
+
size 4998372328
|
model-00006-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f1bf584fa1638aeb9fcd23102e04534c959a2408a2deb1b54dcabf6185ebd802
|
| 3 |
+
size 4998372624
|
model-00007-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d4323b3b954972da356c1e0b42b8d21caee5cc3690e34428d6269d336190e7ae
|
| 3 |
+
size 4994815768
|
model-00008-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:933f1fed4f7c10d332d0e6cd7e261e7df966ca9621a774e9943e545a40458aa0
|
| 3 |
+
size 4998374096
|
model-00009-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2cd6224b30ea0e56fc7bfbc89816a54adfee42575fd060dd243e80e0ac5e2243
|
| 3 |
+
size 4998374320
|
model-00011-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4e51ed4d2c8e1f3376e6e0b80f9ef080e3af98f11b9de545a36d129289c05a72
|
| 3 |
+
size 4998374032
|
model-00012-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f93fbb817a592a6d917140fadee0fa250e8afd1abce95dda7654b6a18279d38c
|
| 3 |
+
size 4998374096
|
model-00013-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a50b1696339151ad5f0b1d0dc6593b6d6b94b0982653fd76ff8d4b6350bebfc6
|
| 3 |
+
size 4998374440
|
model-00014-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:67e75c122f81c42b0e56b25735ffe29312b89be02724fa6c778347728e435c9b
|
| 3 |
+
size 4994816216
|
model-00015-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ad077aec9acb226cae8fa2b809e80488b9cffe4a166eb7fb3c00221c6e48a81
|
| 3 |
+
size 4998374096
|
model-00019-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:917058d250dc0974af2656663a57ea1fd283b3cece66f0d30ac877d6a925c07e
|
| 3 |
+
size 4998374096
|
model-00020-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb1727fcde3fd192761171935e1f9b06380341c2cfab2e1a3610a593d5547bcd
|
| 3 |
+
size 4998374264
|
model-00021-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4bc58a7b990e2f2f4422f48e414b65b8943cf0f000a6fd725eb3d782776efb40
|
| 3 |
+
size 4997437336
|
model-00022-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:62c56868a43fcb7ba39d506b7e6f846e17e4e4d03de8b9a643e67ccfc8a79df7
|
| 3 |
+
size 4995752920
|
model-00023-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c4c8559f484d66c54a023400a4772296fe0e5de289ecef67b6cf7c4eb1ec7b8
|
| 3 |
+
size 4998374096
|
model-00024-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5051e5b282ccb4e982f2109af8103292f34c1ce838b0a32b8b49c0d7f6d10c12
|
| 3 |
+
size 4998374384
|
model-00025-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f5332ff916f544abb8dd885f53f9ff7ebf90ec6b143725b27e1829ef133c9ae
|
| 3 |
+
size 4994816200
|
model-00026-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cd697ce4e4cfbd5e876084e544d30853c948730e2003d53ad8e6205bd0ed1e2a
|
| 3 |
+
size 4998374096
|
model-00027-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a5b5e42a2bd757ab9841b0ed522f0fa8da38bea7ec44d10f8fd062f05e3e5a6
|
| 3 |
+
size 4998374096
|
model-00029-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8aa567026503af4dc9e2fc2025bff441ca4cc574e0551811d34c11d27b80dffb
|
| 3 |
+
size 4994816240
|
model-00047-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d1c46a92f7db8afc26dce9187ba487e25c21e49105a822fc01e883cc91cf84e
|
| 3 |
+
size 4979088680
|
model-00048-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4f84d6fb2285ac676319caaab754c2c314d20f4c605fa9c0a09fa226c9d678f3
|
| 3 |
+
size 4998372232
|
model-00049-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:53441dd631912462c7145d496b40b6244ced0fd5b554c5ce04a19f5c44c1dbda
|
| 3 |
+
size 4998374096
|
model-00050-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c7a1ab854e97fe0d1b281e56f1687dc37e19a9b9711ce67e9c7d8a236f6d3bc
|
| 3 |
+
size 4998374384
|
model-00051-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c4d3bc5e40baa6c543fe5228a0214229c9fcd38af75e22e3a2d126c24dd342a2
|
| 3 |
+
size 4994816200
|
model-00052-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df23010db8b80e42961bcb43c59102b513575390cf8b84915221f25eafead832
|
| 3 |
+
size 4998374096
|
model-00053-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef8aae2e07efa9bce7b9b92c7681502343d64cb9c17ebe74a17cc956ff2bd006
|
| 3 |
+
size 4998374096
|
model-00054-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5e803c5a74134e46488861cd6288b04a326f59e9947250887579da4a96bc8aba
|
| 3 |
+
size 4998374496
|
model-00057-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e145070ce86fec35508da1d78734b4527b23a629a114c6c9c241acf3a5535cd4
|
| 3 |
+
size 4998374216
|
model-00058-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1097413e902e6ecba58f1f63cb0bc6a7aa1b0b55e675840db340bfe0423c74fe
|
| 3 |
+
size 4998374496
|
model-00059-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30fe58ffe52bef2edec0f3b5c4358be2901c1471dc488cb89e1d14760c2910fa
|
| 3 |
+
size 4994816144
|
model-00060-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dacedc65ea8d7cbc30fba94b9cdc4a9b25c1a6575a655665d3d2e52470764dc4
|
| 3 |
+
size 4998374096
|
model-00061-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de7d9df020f3c761a20d4b00c6678495c14a41cb7fea80f825e5012517622d6f
|
| 3 |
+
size 4998374328
|
model-00063-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eabef1dcce7a4bf9759aa942f8652df8e943b81482b1d6e209615c6a61b1335e
|
| 3 |
+
size 4998374040
|
model-00064-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:07294d2a8439b2a07305a1da53419f7e3b3ef11dee010dc1e9ae790e86cd2ba9
|
| 3 |
+
size 4998374096
|
model-00066-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3326ac4736cfaf72bd2e07e999a25ba261b5eafa88b1c6d2cbe70a54d3d94a2a
|
| 3 |
+
size 4994816224
|
model-00068-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d74cd730c64cf3dccbd90b4a2671ae8a641934a00155f9847dfb5ad88ff9f93
|
| 3 |
+
size 4998374160
|
model-00069-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a8c8c5bda7811c0f54ef6707bd6b07573fbae75dd53a42f2112a41bec652400
|
| 3 |
+
size 4998374496
|
model-00070-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:73dcdd107c593331785ff2551195a9f6d53a5368d89e839553d7f86feea743aa
|
| 3 |
+
size 4994816168
|
model-00071-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d01d53a09caa4833a88c7efdc6378c011b2b7cc72c79168c77e831386a5f814
|
| 3 |
+
size 4636515144
|
model.safetensors.index.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:748fd383bd8edc0e563fb7185fce39f30415df664b8ae8e925cf84504fe9407b
|
| 3 |
+
size 12321845
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"additional_special_tokens": [
|
| 3 |
+
"<|endoftext|>",
|
| 4 |
+
"[MASK]",
|
| 5 |
+
"[gMASK]",
|
| 6 |
+
"[sMASK]",
|
| 7 |
+
"<sop>",
|
| 8 |
+
"<eop>",
|
| 9 |
+
"<|system|>",
|
| 10 |
+
"<|user|>",
|
| 11 |
+
"<|assistant|>",
|
| 12 |
+
"<|observation|>",
|
| 13 |
+
"<|begin_of_image|>",
|
| 14 |
+
"<|end_of_image|>",
|
| 15 |
+
"<|begin_of_video|>",
|
| 16 |
+
"<|end_of_video|>",
|
| 17 |
+
"<|begin_of_audio|>",
|
| 18 |
+
"<|end_of_audio|>",
|
| 19 |
+
"<|begin_of_transcription|>",
|
| 20 |
+
"<|end_of_transcription|>",
|
| 21 |
+
"<|code_prefix|>",
|
| 22 |
+
"<|code_middle|>",
|
| 23 |
+
"<|code_suffix|>",
|
| 24 |
+
"/nothink"
|
| 25 |
+
],
|
| 26 |
+
"eos_token": {
|
| 27 |
+
"content": "<|endoftext|>",
|
| 28 |
+
"lstrip": false,
|
| 29 |
+
"normalized": false,
|
| 30 |
+
"rstrip": false,
|
| 31 |
+
"single_word": false
|
| 32 |
+
},
|
| 33 |
+
"pad_token": "<|endoftext|>"
|
| 34 |
+
}
|
tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bda8e2146c3bb7b7e0fc96dcc4f0aeff041c6c27952e3ace0665663ebff346ba
|
| 3 |
+
size 19970700
|