alpindale committed on Oct 2, 2025

Commit

5219edf

verified ·

1 Parent(s): a139639

Add files using upload-large-folder tool

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +1 -0
chat_template.jinja +103 -0
config.json +89 -0
generation_config.json +10 -0
model-00003-of-00072.safetensors +3 -0
model-00006-of-00072.safetensors +3 -0
model-00007-of-00072.safetensors +3 -0
model-00011-of-00072.safetensors +3 -0
model-00013-of-00072.safetensors +3 -0
model-00014-of-00072.safetensors +3 -0
model-00015-of-00072.safetensors +3 -0
model-00017-of-00072.safetensors +3 -0
model-00018-of-00072.safetensors +3 -0
model-00020-of-00072.safetensors +3 -0
model-00021-of-00072.safetensors +3 -0
model-00027-of-00072.safetensors +3 -0
model-00028-of-00072.safetensors +3 -0
model-00031-of-00072.safetensors +3 -0
model-00034-of-00072.safetensors +3 -0
model-00036-of-00072.safetensors +3 -0
model-00037-of-00072.safetensors +3 -0
model-00039-of-00072.safetensors +3 -0
model-00041-of-00072.safetensors +3 -0
model-00043-of-00072.safetensors +3 -0
model-00044-of-00072.safetensors +3 -0
model-00046-of-00072.safetensors +3 -0
model-00047-of-00072.safetensors +3 -0
model-00048-of-00072.safetensors +3 -0
model-00049-of-00072.safetensors +3 -0
model-00050-of-00072.safetensors +3 -0
model-00051-of-00072.safetensors +3 -0
model-00052-of-00072.safetensors +3 -0
model-00053-of-00072.safetensors +3 -0
model-00054-of-00072.safetensors +3 -0
model-00055-of-00072.safetensors +3 -0
model-00057-of-00072.safetensors +3 -0
model-00058-of-00072.safetensors +3 -0
model-00060-of-00072.safetensors +3 -0
model-00062-of-00072.safetensors +3 -0
model-00063-of-00072.safetensors +3 -0
model-00064-of-00072.safetensors +3 -0
model-00066-of-00072.safetensors +3 -0
model-00067-of-00072.safetensors +3 -0
model-00068-of-00072.safetensors +3 -0
model-00071-of-00072.safetensors +3 -0
model-00072-of-00072.safetensors +3 -0
model.safetensors.index.json +0 -0
recipe.yaml +20 -0
special_tokens_map.json +40 -0
tokenizer.json +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

chat_template.jinja ADDED Viewed

	@@ -0,0 +1,103 @@

+[gMASK]<sop>
+{%- if tools -%}
+<|system|>
+# Tools
+You may call one or more functions to assist with the user query.
+You are provided with function signatures within <tools></tools> XML tags:
+<tools>
+{% for tool in tools %}
+{{ tool | tojson(ensure_ascii=False) }}
+{% endfor %}
+</tools>
+For each function call, output the function name and arguments within the following XML format:
+<tool_call>{function-name}
+<arg_key>{arg-key-1}</arg_key>
+<arg_value>{arg-value-1}</arg_value>
+<arg_key>{arg-key-2}</arg_key>
+<arg_value>{arg-value-2}</arg_value>
+...
+</tool_call>{%- endif -%}
+{%- macro visible_text(content) -%}
+    {%- if content is string -%}
+        {{- content }}
+    {%- elif content is iterable and content is not mapping -%}
+        {%- for item in content -%}
+            {%- if item is mapping and item.type == 'text' -%}
+                {{- item.text }}
+            {%- elif item is string -%}
+                {{- item }}
+            {%- endif -%}
+        {%- endfor -%}
+    {%- else -%}
+        {{- content }}
+    {%- endif -%}
+{%- endmacro -%}
+{%- set ns = namespace(last_user_index=-1) %}
+{%- for m in messages %}
+    {%- if m.role == 'user' %}
+        {% set ns.last_user_index = loop.index0 -%}
+    {%- endif %}
+{%- endfor %}
+{% for m in messages %}
+{%- if m.role == 'user' -%}<|user|>
+{{ visible_text(m.content) }}
+{{- '/nothink' if (enable_thinking is defined and not enable_thinking and not visible_text(m.content).endswith("/nothink")) else '' -}}
+{%- elif m.role == 'assistant' -%}
+<|assistant|>
+{%- set reasoning_content = '' %}
+{%- set content = visible_text(m.content) %}
+{%- if m.reasoning_content is string %}
+    {%- set reasoning_content = m.reasoning_content %}
+{%- else %}
+    {%- if '</think>' in content %}
+        {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
+        {%- set content = content.split('</think>')[-1].lstrip('\n') %}
+    {%- endif %}
+{%- endif %}
+{%- if loop.index0 > ns.last_user_index and reasoning_content -%}
+{{ '\n<think>' + reasoning_content.strip() +  '</think>'}}
+{%- else -%}
+{{ '\n<think></think>' }}
+{%- endif -%}
+{%- if content.strip() -%}
+{{ '\n' + content.strip() }}
+{%- endif -%}
+{% if m.tool_calls %}
+{% for tc in m.tool_calls %}
+{%- if tc.function %}
+    {%- set tc = tc.function %}
+{%- endif %}
+{{ '\n<tool_call>' + tc.name }}
+{% set _args = tc.arguments %}
+{% for k, v in _args.items() %}
+<arg_key>{{ k }}</arg_key>
+<arg_value>{{ v | tojson(ensure_ascii=False) if v is not string else v }}</arg_value>
+{% endfor %}
+</tool_call>{% endfor %}
+{% endif %}
+{%- elif m.role == 'tool' -%}
+{%- if m.content is string -%}
+{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
+    {{- '<|observation|>' }}
+{%- endif %}
+{{- '\n<tool_response>\n' }}
+{{- m.content }}
+{{- '\n</tool_response>' }}
+{%- else -%}
+<|observation|>{% for tr in m.content %}
+<tool_response>
+{{ tr.output if tr.output is defined else tr }}
+</tool_response>{% endfor -%}
+{% endif -%}
+{%- elif m.role == 'system' -%}
+<|system|>
+{{ visible_text(m.content) }}
+{%- endif -%}
+{%- endfor -%}
+{%- if add_generation_prompt -%}
+    <|assistant|>{{- '\n<think></think>' if (enable_thinking is defined and not enable_thinking) else '' -}}
+{%- endif -%}

config.json ADDED Viewed

	@@ -0,0 +1,89 @@

+{
+  "architectures": [
+    "Glm4MoeForCausalLM"
+  ],
+  "attention_bias": true,
+  "attention_dropout": 0.0,
+  "dtype": "bfloat16",
+  "eos_token_id": [
+    151329,
+    151336,
+    151338
+  ],
+  "first_k_dense_replace": 3,
+  "head_dim": 128,
+  "hidden_act": "silu",
+  "hidden_size": 5120,
+  "initializer_range": 0.02,
+  "intermediate_size": 12288,
+  "max_position_embeddings": 202752,
+  "model_type": "glm4_moe",
+  "moe_intermediate_size": 1536,
+  "n_group": 1,
+  "n_routed_experts": 160,
+  "n_shared_experts": 1,
+  "norm_topk_prob": true,
+  "num_attention_heads": 96,
+  "num_experts_per_tok": 8,
+  "num_hidden_layers": 92,
+  "num_key_value_heads": 8,
+  "num_nextn_predict_layers": 1,
+  "pad_token_id": 151329,
+  "partial_rotary_factor": 0.5,
+  "quantization_config": {
+    "config_groups": {
+      "group_0": {
+        "format": "int-quantized",
+        "input_activations": {
+          "actorder": null,
+          "block_structure": null,
+          "dynamic": true,
+          "group_size": null,
+          "num_bits": 8,
+          "observer": null,
+          "observer_kwargs": {},
+          "strategy": "token",
+          "symmetric": true,
+          "type": "int"
+        },
+        "output_activations": null,
+        "targets": [
+          "Linear"
+        ],
+        "weights": {
+          "actorder": null,
+          "block_structure": null,
+          "dynamic": false,
+          "group_size": null,
+          "num_bits": 8,
+          "observer": "minmax",
+          "observer_kwargs": {},
+          "strategy": "channel",
+          "symmetric": true,
+          "type": "int"
+        }
+      }
+    },
+    "format": "int-quantized",
+    "global_compression_ratio": null,
+    "ignore": [
+      "lm_head"
+    ],
+    "kv_cache_scheme": null,
+    "quant_method": "compressed-tensors",
+    "quantization_status": "compressed",
+    "sparsity_config": {},
+    "transform_config": {},
+    "version": "0.11.1.a20250929"
+  },
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 1000000,
+  "routed_scaling_factor": 2.5,
+  "tie_word_embeddings": false,
+  "topk_group": 1,
+  "transformers_version": "4.56.2",
+  "use_cache": true,
+  "use_qk_norm": true,
+  "vocab_size": 151552
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "_from_model_config": true,
+  "eos_token_id": [
+    151329,
+    151336,
+    151338
+  ],
+  "pad_token_id": 151329,
+  "transformers_version": "4.56.2"
+}

model-00003-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ac77ad4bb789058b2578f94871bcbca84b62908ecc65b202099d6ad9001936cc
+size 4998103744

model-00006-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ad40f9336c7ecb066810cfa34641f316bc2b535877d9f992c0f7a0abd9015414
+size 4993852200

model-00007-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8763e8e8b905c6a3baf0e4142be77a4039013468f2b5928b3f079f40c9f506ca
+size 4998104608

model-00011-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:059e9bdbf72e2a7f03607448ebe35b206eca1cd73e54c0fb6ad1bcf52fe992d1
+size 4993853064

model-00013-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2575e328cc8edf57a9c96c3175f858f838484350a28f81dee721489e21d140bf
+size 4993846160

model-00014-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7d00237637fba0cb985f12fb3d2479a0a515d4c3f3366c46c465b73fb729f2f3
+size 4998104984

model-00015-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:de97771d00a1d5187a7564bc34f776b8d81e5cd5e8aa1294f968e267ed81d1c7
+size 4993853120

model-00017-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:de8be494937d1b7a45789fd6b92906fa1b2efbd4be3115dcbe7e2f01bf0aedd5
+size 4993846232

model-00018-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d6ab858c30ba48d4e25fa40a114c6c44108a0b31aa26baa747222a8dd18f4cef
+size 4998104984

model-00020-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1e2c949ed4df0c07022ec6ee3bfdb2e67490741fae398a908240f71d456dbd4e
+size 4993853200

model-00021-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d247773dffb9052d2a2ff239336819dd33a022d631462db460d98b6a4a2b6a7c
+size 4993846304

model-00027-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e37a8599466d884c636d2a2e63de4e31f80ca5c0fcffc66f603fe037c5ed4a57
+size 4993853120

model-00028-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:20c372029a04f2d1ce515a6ace38cfe4becf32cb539f56fc35f41545287f3bbb
+size 4993853344

model-00031-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cbc1291ec759820ed6f8dd2be7c65b07573ac793f91f1eedb5a82723bd1c7531
+size 4993853152

model-00034-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:58eae74fbc4fdaffae3508e56e2d0d039ec92385c0c30e3a17af7aab027b76fa
+size 4993845952

model-00036-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5a40a87bca7d66b374eab36eacff7954633e9f6d60b68356765b879c4771f9a
+size 4971903376

model-00037-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fc2e1de00e01f1139f2beaea204e60fa678120f6eeb66ede1370195089d3c11c
+size 4996444640

model-00039-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:28644c0d3aee8444009bdf422bbef87c8966149e5b4d7c658fac9d7a4030512a
+size 4993853288

model-00041-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:39fdefdb8570714bd148da5fd2ab152ff199e10a2673608e35b379fb9c38d217
+size 4993853096

model-00043-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8f7b7f333a50b479e3e653a46a6282ea814e08b3d0cbbefca2782bb5dd62d46b
+size 4993853360

model-00044-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4cac993c1f4ea8480222b657fc39abfd51530e25ffee4a4b83536ae63a51505e
+size 4998104984

model-00046-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e027a656aeb6ef5d915abd4235b55d1a515922018fe3db5fac559a563028c701
+size 4993845992

model-00047-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9d56513358c95e4e94821781d9722d6fce13b1d39731402095a6974c9c3dd9c4
+size 4993853432

model-00048-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b30022cf760a17f5e4922849f3137ad79258ed1cdad4f068de6e40805d098785
+size 4998104984

model-00049-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4b8bd434dabf51e507a84024d06f6316c9f2e3d1efaa1c6cffea3d5be7c78868
+size 4993853120

model-00050-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6c191de47ed157d5efea81c19d8fcdfa136a6d39e114ee2063ba0d9b0f2516d5
+size 4993846064

model-00051-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e7d7259ddb27c4c628803ca282724bed1ec09522a89f0b25be6bf17c3f9a460
+size 4990274256

model-00052-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ca6bfb763a822457de13afcf5d251ceb26a0f2375ea0b2cec487849cfab20e30
+size 4993816208

model-00053-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ae4664942f63681cde9a3a4461460fe228ab60993706c106902941343ea6dba1
+size 4993845952

model-00054-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5b62456ca975de0331c5ab79b71a95287e4e7633034c64af72bc41dcec865fc
+size 4993853312

model-00055-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:325707ea5841566aaf7cf207c1422a65675801656a04c207384b3a351d09e0ac
+size 4998104984

model-00057-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ea3dda22d0aede442d305677f42897cf2d78dcfc65ed7cd56caec9b425eb8c7f
+size 4993845952

model-00058-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0a3c72b2912db7384586c6e779ac97f58e9aba52e585251e138cd3809272722e
+size 4993853384

model-00060-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0908615b54ec1031ca76333a38395692479e9cfed4d924383c3190c422673e99
+size 4993853120

model-00062-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5c0a6d09da6725db8861f67808474e753d711a5e1a42a601ad28fca551d30d7
+size 4993853456

model-00063-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d8de54c1d09ab4fe877fd4c259c7085972cd37bcc9e4a751b5a543abb0af34b8
+size 4998104984

model-00064-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1969d70e431bf35f574c80b158a5d67b2d406fa5fc834cdfa16ff6064a71de3a
+size 4993853120

model-00066-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d4e3e39f54f6db83b9cc919f3bb8e7838bc3b40c254520bc63ced74067ee510e
+size 4998105040

model-00067-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:06ef205906956a99d6a5b9e884037f7bfda8569450aafbdd44832005cd64ba93
+size 4993853064

model-00068-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e20d53ae55e4842cdaa2732d4f699a06edc2f3f1da0fc9ecbcb2d2fe83edb42a
+size 4993853120

model-00071-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2ff2c69ec7b19d530ed6274f5a663018d4897f63397c840a51e1cd306a88d1cd
+size 3503836824

model-00072-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f7ed732a1f52d39814adc6a0b127bad1c816b89d7055fa07b029cba98deba7bf
+size 1551892608

model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

recipe.yaml ADDED Viewed

	@@ -0,0 +1,20 @@

+default_stage:
+  default_modifiers:
+    SmoothQuantModifier:
+      smoothing_strength: 0.8
+      mappings:
+      - !!python/tuple
+        - ['re:.*q_proj', 're:.*k_proj', 're:.*v_proj']
+        - re:.*input_layernorm
+      - !!python/tuple
+        - ['re:.*gate_proj', 're:.*up_proj']
+        - re:.*post_attention_layernorm
+      ignore: []
+    GPTQModifier:
+      targets: [Linear]
+      ignore: [lm_head, 're:.*mlp.gate$']
+      scheme: W8A8
+      block_size: 128
+      dampening_frac: 0.01
+      actorder: static
+      offload_hessians: false

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "additional_special_tokens": [
+    "<|endoftext|>",
+    "[MASK]",
+    "[gMASK]",
+    "[sMASK]",
+    "<sop>",
+    "<eop>",
+    "<|system|>",
+    "<|user|>",
+    "<|assistant|>",
+    "<|observation|>",
+    "<|begin_of_image|>",
+    "<|end_of_image|>",
+    "<|begin_of_video|>",
+    "<|end_of_video|>",
+    "<|begin_of_audio|>",
+    "<|end_of_audio|>",
+    "<|begin_of_transcription|>",
+    "<|end_of_transcription|>",
+    "<|code_prefix|>",
+    "<|code_middle|>",
+    "<|code_suffix|>",
+    "/nothink"
+  ],
+  "eos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bda8e2146c3bb7b7e0fc96dcc4f0aeff041c6c27952e3ace0665663ebff346ba
+size 19970700